pandaphd committed on
Commit
f834ec5
·
1 Parent(s): 3081400

weights and unet_merged

Browse files
README.md CHANGED
@@ -1,3 +1,41 @@
1
  ---
2
  license: cc-by-nc-nd-4.0
 
 
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: cc-by-nc-nd-4.0
3
+ language:
4
+ - en
5
+ pipeline_tag: text-to-video
6
+ tags:
7
+ - video generation
8
+ - image generation
9
  ---
10
+ # Generative Photography
11
+
12
+
13
+ <p align="center">
14
+ &nbsp;&nbsp; <a href="https://generative-photography.github.io/project/">Project Page</a> &nbsp;&nbsp;| &nbsp;&nbsp; <a href="https://arxiv.org/abs/2412.02168">Paper</a> &nbsp;&nbsp;| &nbsp;&nbsp; <a href="https://github.com/pandayuanyu/generative-photography">GitHub</a>&nbsp;&nbsp;
15
+ <br>
16
+ -----
17
+
18
+ [**Generative Photography: Scene-Consistent Camera Control for
19
+ Realistic Text-to-Image Synthesis**](https://arxiv.org/abs/2412.02168) <br>
20
+
21
+ In this repository, we present **Generative Photography**, a
22
+ new
23
+
24
+ ## 🔥 Latest News!!
25
+
26
+ * March 3, 2025: Release the official code and pre-trained weights.
27
+ * Feb 26, 2025: Paper is accepted by CVPR 2025!
28
+ * Dec 20, 2024: Release dataset.
29
+
30
+
31
+ ## Citation
32
+ If you find our work helpful, please cite us.
33
+ ```bibtex
34
+ @article{Yuan_2024_GenPhoto,
35
+ title={Generative Photography: Scene-Consistent Camera Control for Realistic Text-to-Image Synthesis},
36
+ author={Yuan, Yu and Wang, Xijun and Sheng, Yichen and Chennuri, Prateek and Zhang, Xingguang and Chan, Stanley},
37
+ journal={CVPR},
38
+ year={2025}
39
+ }
40
+ ```
41
+
unet_merged/config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.6.0",
4
+ "act_fn": "silu",
5
+ "attention_head_dim": 8,
6
+ "block_out_channels": [
7
+ 320,
8
+ 640,
9
+ 1280,
10
+ 1280
11
+ ],
12
+ "center_input_sample": false,
13
+ "cross_attention_dim": 768,
14
+ "down_block_types": [
15
+ "CrossAttnDownBlock2D",
16
+ "CrossAttnDownBlock2D",
17
+ "CrossAttnDownBlock2D",
18
+ "DownBlock2D"
19
+ ],
20
+ "downsample_padding": 1,
21
+ "flip_sin_to_cos": true,
22
+ "freq_shift": 0,
23
+ "in_channels": 4,
24
+ "layers_per_block": 2,
25
+ "mid_block_scale_factor": 1,
26
+ "norm_eps": 1e-05,
27
+ "norm_num_groups": 32,
28
+ "out_channels": 4,
29
+ "sample_size": 64,
30
+ "up_block_types": [
31
+ "UpBlock2D",
32
+ "CrossAttnUpBlock2D",
33
+ "CrossAttnUpBlock2D",
34
+ "CrossAttnUpBlock2D"
35
+ ]
36
+ }
unet_merged/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:271d13f0e7799e4fc96b45c91fa7c54fdd67b99ff53bf30b7dbc9ef1c9eac279
3
+ size 3438167504
unet_merged/diffusion_pytorch_model.safetensors.baiduyun.uploading.cfg ADDED
Binary file (85.2 kB). View file
 
weights/RealEstate10K_LoRA.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:798b894092f96d2d141a4932546eeb19cc60955ba69456921649e6efe34e2554
3
+ size 1156140341
weights/checkpoint-bokehK.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaf405f1c9799557e9b4ecc2b80b53cde56055ed78c0e27c55c341c74c5d375a
3
+ size 2619385373
weights/checkpoint-color_temperature.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a82f87d79dbd7236abdd8a9aa7cd25e47044739f899846b183a13fa10dd41501
3
+ size 2619385373
weights/checkpoint-focal_length.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f756e0dcdaeefc869bf39ffdb1b73ec5523b800437185f0a310fa68182c35e1
3
+ size 2619385373
weights/checkpoint-shutter_speed.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fad5584cfd1595d6196125b90861ab2d2ee0db962df38a88344be8282fdb11a
3
+ size 2619385373
weights/v3_sd15_mm.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2412711886f61091846f53204aabc38aa6e09356d62a9808abe4daa802168343
3
+ size 1673262583