weights and unet_merged
Browse files- README.md +38 -0
- unet_merged/config.json +36 -0
- unet_merged/diffusion_pytorch_model.safetensors +3 -0
- unet_merged/diffusion_pytorch_model.safetensors.baiduyun.uploading.cfg +0 -0
- weights/RealEstate10K_LoRA.ckpt +3 -0
- weights/checkpoint-bokehK.ckpt +3 -0
- weights/checkpoint-color_temperature.ckpt +3 -0
- weights/checkpoint-focal_length.ckpt +3 -0
- weights/checkpoint-shutter_speed.ckpt +3 -0
- weights/v3_sd15_mm.ckpt +3 -0
README.md
CHANGED
@@ -1,3 +1,41 @@
|
|
1 |
---
|
2 |
license: cc-by-nc-nd-4.0
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
---
|
2 |
license: cc-by-nc-nd-4.0
|
3 |
+
language:
|
4 |
+
- en
|
5 |
+
pipeline_tag: text-to-video
|
6 |
+
tags:
|
7 |
+
- video generation
|
8 |
+
- image generation
|
9 |
---
|
10 |
+
# Generative Photography
|
11 |
+
|
12 |
+
|
13 |
+
<p align="center">
|
14 |
+
   <a href="https://generative-photography.github.io/project/">Project Page</a>   |    <a href="https://arxiv.org/abs/2412.02168">Paper</a>   |    <a href="https://github.com/pandayuanyu/generative-photography">Github</a>  
|
15 |
+
<br>
|
16 |
+
-----
|
17 |
+
|
18 |
+
[**Generative Photography: Scene-Consistent Camera Control for
|
19 |
+
Realistic Text-to-Image Synthesis**](https://arxiv.org/abs/2412.02168) <br>
|
20 |
+
|
21 |
+
In this repository, we present **Generative Photography**, a
|
22 |
+
new framework for scene-consistent camera control in realistic text-to-image synthesis.
|
23 |
+
|
24 |
+
## 🔥 Latest News!!
|
25 |
+
|
26 |
+
* March 3, 2025: Release official code and pre-trained weights.
|
27 |
+
* Feb 26, 2025: Paper accepted to CVPR 2025!
|
28 |
+
* Dec 20, 2024: Release dataset.
|
29 |
+
|
30 |
+
|
31 |
+
## Citation
|
32 |
+
If you find our work helpful, please cite us.
|
33 |
+
```bibtex
|
34 |
+
@article{Yuan_2024_GenPhoto,
|
35 |
+
title={Generative Photography: Scene-Consistent Camera Control for Realistic Text-to-Image Synthesis},
|
36 |
+
author={Yuan, Yu and Wang, Xijun and Sheng, Yichen and Chennuri, Prateek and Zhang, Xingguang and Chan, Stanley},
|
37 |
+
journal={CVPR},
|
38 |
+
year={2025}
|
39 |
+
}
|
40 |
+
```
|
41 |
+
|
unet_merged/config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.6.0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"attention_head_dim": 8,
|
6 |
+
"block_out_channels": [
|
7 |
+
320,
|
8 |
+
640,
|
9 |
+
1280,
|
10 |
+
1280
|
11 |
+
],
|
12 |
+
"center_input_sample": false,
|
13 |
+
"cross_attention_dim": 768,
|
14 |
+
"down_block_types": [
|
15 |
+
"CrossAttnDownBlock2D",
|
16 |
+
"CrossAttnDownBlock2D",
|
17 |
+
"CrossAttnDownBlock2D",
|
18 |
+
"DownBlock2D"
|
19 |
+
],
|
20 |
+
"downsample_padding": 1,
|
21 |
+
"flip_sin_to_cos": true,
|
22 |
+
"freq_shift": 0,
|
23 |
+
"in_channels": 4,
|
24 |
+
"layers_per_block": 2,
|
25 |
+
"mid_block_scale_factor": 1,
|
26 |
+
"norm_eps": 1e-05,
|
27 |
+
"norm_num_groups": 32,
|
28 |
+
"out_channels": 4,
|
29 |
+
"sample_size": 64,
|
30 |
+
"up_block_types": [
|
31 |
+
"UpBlock2D",
|
32 |
+
"CrossAttnUpBlock2D",
|
33 |
+
"CrossAttnUpBlock2D",
|
34 |
+
"CrossAttnUpBlock2D"
|
35 |
+
]
|
36 |
+
}
|
unet_merged/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:271d13f0e7799e4fc96b45c91fa7c54fdd67b99ff53bf30b7dbc9ef1c9eac279
|
3 |
+
size 3438167504
|
unet_merged/diffusion_pytorch_model.safetensors.baiduyun.uploading.cfg
ADDED
Binary file (85.2 kB). View file
|
|
weights/RealEstate10K_LoRA.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:798b894092f96d2d141a4932546eeb19cc60955ba69456921649e6efe34e2554
|
3 |
+
size 1156140341
|
weights/checkpoint-bokehK.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaf405f1c9799557e9b4ecc2b80b53cde56055ed78c0e27c55c341c74c5d375a
|
3 |
+
size 2619385373
|
weights/checkpoint-color_temperature.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a82f87d79dbd7236abdd8a9aa7cd25e47044739f899846b183a13fa10dd41501
|
3 |
+
size 2619385373
|
weights/checkpoint-focal_length.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f756e0dcdaeefc869bf39ffdb1b73ec5523b800437185f0a310fa68182c35e1
|
3 |
+
size 2619385373
|
weights/checkpoint-shutter_speed.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fad5584cfd1595d6196125b90861ab2d2ee0db962df38a88344be8282fdb11a
|
3 |
+
size 2619385373
|
weights/v3_sd15_mm.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2412711886f61091846f53204aabc38aa6e09356d62a9808abe4daa802168343
|
3 |
+
size 1673262583
|