AACEE committed on
Commit
754f79a
·
1 Parent(s): cf849bf

End of training

Browse files
Files changed (40) hide show
  1. README.md +2 -2
  2. checkpoint-1000/optimizer.bin +2 -2
  3. checkpoint-1000/pytorch_model.bin +2 -2
  4. checkpoint-1000/random_states_0.pkl +1 -1
  5. checkpoint-1500/optimizer.bin +2 -2
  6. checkpoint-1500/pytorch_model.bin +2 -2
  7. checkpoint-1500/random_states_0.pkl +2 -2
  8. checkpoint-2000/optimizer.bin +2 -2
  9. checkpoint-2000/pytorch_model.bin +2 -2
  10. checkpoint-2000/random_states_0.pkl +1 -1
  11. checkpoint-2500/optimizer.bin +2 -2
  12. checkpoint-2500/pytorch_model.bin +2 -2
  13. checkpoint-2500/random_states_0.pkl +2 -2
  14. checkpoint-3000/optimizer.bin +2 -2
  15. checkpoint-3000/pytorch_model.bin +2 -2
  16. checkpoint-3000/random_states_0.pkl +1 -1
  17. checkpoint-500/optimizer.bin +2 -2
  18. checkpoint-500/pytorch_model.bin +2 -2
  19. checkpoint-500/random_states_0.pkl +1 -1
  20. feature_extractor/preprocessor_config.json +16 -12
  21. learned_embeds-steps-1000.bin +2 -2
  22. learned_embeds-steps-1500.bin +2 -2
  23. learned_embeds-steps-2000.bin +2 -2
  24. learned_embeds-steps-2500.bin +2 -2
  25. learned_embeds-steps-3000.bin +2 -2
  26. learned_embeds-steps-500.bin +2 -2
  27. learned_embeds.bin +2 -2
  28. logs/textual_inversion/1689107596.745057/events.out.tfevents.1689107596.p4de-st-p4de24xlarge-564.3414741.1 +3 -0
  29. logs/textual_inversion/1689107596.7586236/hparams.yml +46 -0
  30. logs/textual_inversion/events.out.tfevents.1689107596.p4de-st-p4de24xlarge-564.3414741.0 +3 -0
  31. model_index.json +3 -3
  32. safety_checker/config.json +168 -0
  33. safety_checker/pytorch_model.bin +3 -0
  34. text_encoder/config.json +7 -7
  35. text_encoder/pytorch_model.bin +2 -2
  36. tokenizer/special_tokens_map.json +1 -1
  37. unet/config.json +6 -11
  38. unet/diffusion_pytorch_model.bin +2 -2
  39. vae/config.json +2 -2
  40. vae/diffusion_pytorch_model.bin +1 -1
README.md CHANGED
@@ -1,7 +1,7 @@
1
 
2
  ---
3
  license: creativeml-openrail-m
4
- base_model: stabilityai/stable-diffusion-2-depth
5
  tags:
6
  - stable-diffusion
7
  - stable-diffusion-diffusers
@@ -12,6 +12,6 @@ inference: true
12
  ---
13
 
14
  # Textual inversion text2image fine-tuning - AACEE/textual_inversion_cat
15
- These are textual inversion adaption weights for stabilityai/stable-diffusion-2-depth. You can find some example images in the following.
16
 
17
 
 
1
 
2
  ---
3
  license: creativeml-openrail-m
4
+ base_model: runwayml/stable-diffusion-v1-5
5
  tags:
6
  - stable-diffusion
7
  - stable-diffusion-diffusers
 
12
  ---
13
 
14
  # Textual inversion text2image fine-tuning - AACEE/textual_inversion_cat
15
+ These are textual inversion adaption weights for runwayml/stable-diffusion-v1-5. You can find some example images in the following.
16
 
17
 
checkpoint-1000/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f86107b4fae79babbda76a4f1f28f0871fe74061b6505ca87376b5815a43e793
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:351260f9eb6c37331bb93da4b923f31019d967d148cddfc62ef789b72954b2f1
3
+ size 303570477
checkpoint-1000/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f5c3a29639ba45e9cea80e829cb9e442f4b059a5033d9abbbefdc3234a4bfe7
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe1e0e9d12a24a0019693fe8790beef23c239b7edd1875004cdc9f38346ba1a
3
+ size 492322337
checkpoint-1000/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88f3bb4d20d1d2e810e3d88154f83592d8ff470e0a6db2f699f4663fea4ba8fd
3
  size 14663
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d04ca35edc3dac6f0ff0e7d1e6ce7d6abfb4632dc1380d6d1fb38d1f71e174b
3
  size 14663
checkpoint-1500/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5433aff1ae19cffcfb35c4ce0d9e6038fced4350f3fe109998a969bedef7b8f
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ebaf5197d3c7bbb6f4a165003ca16dc7bf30186f5cc2437b8eae23b49d0758b
3
+ size 303570477
checkpoint-1500/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81bb851115dc65c73cbd2a4c30baec1a92efeae22931204aeb929af8257ac2ff
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb5b2b01c3c8c84b515092139e18aa7be2f6615d53505783cef9a4eb6ad19ddf
3
+ size 492322337
checkpoint-1500/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2eb603eeb1ffbdf46ca43ad8cd7af0d588867c15334ec708a756177883184837
3
- size 14663
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ab04c972b749c68cedd2a6fd9d6a1dd2a3353065765360cfb802ab298f84d5d
3
+ size 14727
checkpoint-2000/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e47e26afdd664980dc8c3b3c7e22f49606e6505bcc24479bc6f9bfa39b0d08a
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:421563e73a9e470eabb6f7877cb0a45817116607c001eed744b8b10851698221
3
+ size 303570477
checkpoint-2000/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d25d8b63c506d2c289849c7921e481c3c2b001413794ebb94693f706651f6a3
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd91ff223221672b82f568b2e3059c68462545264d528ff64efba81da6b759b9
3
+ size 492322337
checkpoint-2000/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09024fcad3c189f1565aed8dc000207537b737c972bd54b6da0b21e114126e66
3
  size 14663
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ecab6d2acd5606f567fda54d15453618b2abddb038aa49cefe22b0291e77217
3
  size 14663
checkpoint-2500/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a035b7cbc9fa0465daf98dbff4522d762e7dc9f5868ff73d1dd69e3ce85b217
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0fa1259f49efd84d1c2dd56633d4f2cf20f5fe42aa3d6d39e888ab86894e34a
3
+ size 303570477
checkpoint-2500/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae23aeb245d00a4cd115f7d0eec3b6bc93742defa8a94dedb9e72fd861cc87dc
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8734d41b742d86d32569fdbb8da2f92353647fc9d612671f5bbd8b3f57780fd
3
+ size 492322337
checkpoint-2500/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f088557d2036ef06daf20def625f4b7c9026d9cac4b17eed2db5cd9830595fce
3
- size 14727
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dc0d16b7010dc42ce5c93c096adc4ead54e6b0f1464f5270a2f19e9fb448709
3
+ size 14663
checkpoint-3000/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:609e7e77fb6906c9504c2195c6d819ffbc08f591f827ae1b998eb70f5d124e94
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fe173af645c8c2c2862f13333d1d98c5ddb347a5913b65614cb1a357ae72499
3
+ size 303570477
checkpoint-3000/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72dfe01f47cf61ec0c0ff81ff7327cc9d224181f8cb8eaa9c06f850f56deda88
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d175faa3f1c86a0a7b62cfd79d9a9017dc6ea61b9fecc632e9a9a8bfb1896a
3
+ size 492322337
checkpoint-3000/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f04b250949009e36eb1b4f73a9c82a2a60986bd58753c7dc302395e3eb62f78a
3
  size 14727
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a82bc1e1947519d800c1f320658d46afda7bf0a26d0343f28cfa87187dd8fc13
3
  size 14727
checkpoint-500/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ba32327b0d5a791fcdb66ccc879fee4f3be13bf250b92929f59b240cd5d65ad
3
- size 404760109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec90a82888971b2e52bb87f2159f6c9b118b5d6e4b4326ead303a73bfba27f3
3
+ size 303570477
checkpoint-500/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5254d8bfbf746625a2635ae9e4bbde62c8522450b94fc8c79c6a5f43a931b799
3
- size 1361701921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfb0b9705f781a508523f48be8dcb685e03eaac67ddcd358942e05b25e6e13b8
3
+ size 492322337
checkpoint-500/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca9d7278da13f4ad233aea006bf58d2980d264f7e42a4965459c92f8f95ad27e
3
  size 14663
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b605ad814bed7e0ba6347aa0fcdf330c324a5d95a70c92710b7430e39aa580c
3
  size 14663
feature_extractor/preprocessor_config.json CHANGED
@@ -1,24 +1,28 @@
1
  {
 
 
 
 
 
 
2
  "do_normalize": true,
3
  "do_rescale": true,
4
  "do_resize": true,
5
- "ensure_multiple_of": 1,
6
  "image_mean": [
7
- 0.5,
8
- 0.5,
9
- 0.5
10
  ],
11
- "image_processor_type": "DPTImageProcessor",
12
  "image_std": [
13
- 0.5,
14
- 0.5,
15
- 0.5
16
  ],
17
- "keep_aspect_ratio": false,
18
- "resample": 2,
19
  "rescale_factor": 0.00392156862745098,
20
  "size": {
21
- "height": 384,
22
- "width": 384
23
  }
24
  }
 
1
  {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
  "do_normalize": true,
9
  "do_rescale": true,
10
  "do_resize": true,
11
+ "feature_extractor_type": "CLIPFeatureExtractor",
12
  "image_mean": [
13
+ 0.48145466,
14
+ 0.4578275,
15
+ 0.40821073
16
  ],
17
+ "image_processor_type": "CLIPImageProcessor",
18
  "image_std": [
19
+ 0.26862954,
20
+ 0.26130258,
21
+ 0.27577711
22
  ],
23
+ "resample": 3,
 
24
  "rescale_factor": 0.00392156862745098,
25
  "size": {
26
+ "shortest_edge": 224
 
27
  }
28
  }
learned_embeds-steps-1000.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71eec6a979cde290edab32752c97eea135e8bb560ced2f6e5470c917cdea6b16
3
- size 5025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e3bfc7f75c1b62d8343b31a8c749d0e2fbff20fae548970b5a195524d558ddf
3
+ size 4001
learned_embeds-steps-1500.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96a24ad42e46a9c1e283834f3bc3c4c4b00319fab8ee99a259aaf681f1a93caf
3
- size 5025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a748badcfca34e770012d55d9532e6e490e414cd7f4a49d8889540d3320b9655
3
+ size 4001
learned_embeds-steps-2000.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a97333e59cc70bcec2a16b6987991dedbf723e1240844ec951a1d0912a1e18fe
3
- size 5025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d45604154ae99357b5808c7fe99ae8a4a6e5ef4e032d0c34c8e45c0a87de2c8d
3
+ size 4001
learned_embeds-steps-2500.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb9a5e491b784d75e03f936aac03ccb047a247a1c8eb1a5e7818433bfa1b956f
3
- size 5025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5fdda7de54b9629579e69a009e4800248edb03f98cc4db011fe3c2fbe753276
3
+ size 4001
learned_embeds-steps-3000.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5228ad0effeb42c5b1276e7a0abf979d79444979ececa432eedb31ec9e34ebec
3
- size 5025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce8b54f9440a566f570137ffdd4cc2a9646cf53dc5ef65de4be96355401d9f6
3
+ size 4001
learned_embeds-steps-500.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d41dd636426fcad891e9890d89f17900e0e4ab6d46e756ca9959e2ef9e239bb
3
- size 5022
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83da42705a3c6a99f5a62c15ffaa5a92569d8dfe8f7ed0f4ee59c5431318fac8
3
+ size 3998
learned_embeds.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b83d87d8cd415a974691112b178320823fceb0e33c63ac8ad7cdf4b6bc4738a
3
- size 4864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b942244a753c8029b2b307b3bc320aadbf4409d3132ad7737a86f9a02f29af18
3
+ size 3840
logs/textual_inversion/1689107596.745057/events.out.tfevents.1689107596.p4de-st-p4de24xlarge-564.3414741.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ae232439c86bc6b38dff25a050eb997239725a1aaf56c9d890c8dc725f89132
3
+ size 2260
logs/textual_inversion/1689107596.7586236/hparams.yml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ dataloader_num_workers: 0
10
+ enable_xformers_memory_efficient_attention: false
11
+ gradient_accumulation_steps: 4
12
+ gradient_checkpointing: false
13
+ hub_model_id: null
14
+ hub_token: null
15
+ initializer_token: toy
16
+ learnable_property: object
17
+ learning_rate: 0.002
18
+ local_rank: -1
19
+ logging_dir: logs
20
+ lr_num_cycles: 1
21
+ lr_scheduler: constant
22
+ lr_warmup_steps: 0
23
+ max_train_steps: 3000
24
+ mixed_precision: 'no'
25
+ num_train_epochs: 20
26
+ num_validation_images: 4
27
+ num_vectors: 1
28
+ output_dir: textual_inversion_cat
29
+ placeholder_token: <cat-toy>
30
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
31
+ push_to_hub: true
32
+ repeats: 100
33
+ report_to: tensorboard
34
+ resolution: 512
35
+ resume_from_checkpoint: null
36
+ revision: null
37
+ save_as_full_pipeline: false
38
+ save_steps: 500
39
+ scale_lr: true
40
+ seed: null
41
+ tokenizer_name: null
42
+ train_batch_size: 1
43
+ train_data_dir: ./cat
44
+ validation_epochs: null
45
+ validation_prompt: null
46
+ validation_steps: 100
logs/textual_inversion/events.out.tfevents.1689107596.p4de-st-p4de24xlarge-564.3414741.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a927eb916203cfe3636aa102fb753ea9baa81b96cacf37ca94e885681a0a095
3
+ size 1007054
model_index.json CHANGED
@@ -3,12 +3,12 @@
3
  "_diffusers_version": "0.18.1",
4
  "feature_extractor": [
5
  "transformers",
6
- "DPTImageProcessor"
7
  ],
8
  "requires_safety_checker": true,
9
  "safety_checker": [
10
- null,
11
- null
12
  ],
13
  "scheduler": [
14
  "diffusers",
 
3
  "_diffusers_version": "0.18.1",
4
  "feature_extractor": [
5
  "transformers",
6
+ "CLIPImageProcessor"
7
  ],
8
  "requires_safety_checker": true,
9
  "safety_checker": [
10
+ "stable_diffusion",
11
+ "StableDiffusionSafetyChecker"
12
  ],
13
  "scheduler": [
14
  "diffusers",
safety_checker/config.json ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_commit_hash": "c9ab35ff5f2c362e9e22fbafe278077e196057f0",
3
+ "_name_or_path": "/data/home/ancao/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/c9ab35ff5f2c362e9e22fbafe278077e196057f0/safety_checker",
4
+ "architectures": [
5
+ "StableDiffusionSafetyChecker"
6
+ ],
7
+ "initializer_factor": 1.0,
8
+ "logit_scale_init_value": 2.6592,
9
+ "model_type": "clip",
10
+ "projection_dim": 768,
11
+ "text_config": {
12
+ "_name_or_path": "",
13
+ "add_cross_attention": false,
14
+ "architectures": null,
15
+ "attention_dropout": 0.0,
16
+ "bad_words_ids": null,
17
+ "begin_suppress_tokens": null,
18
+ "bos_token_id": 0,
19
+ "chunk_size_feed_forward": 0,
20
+ "cross_attention_hidden_size": null,
21
+ "decoder_start_token_id": null,
22
+ "diversity_penalty": 0.0,
23
+ "do_sample": false,
24
+ "dropout": 0.0,
25
+ "early_stopping": false,
26
+ "encoder_no_repeat_ngram_size": 0,
27
+ "eos_token_id": 2,
28
+ "exponential_decay_length_penalty": null,
29
+ "finetuning_task": null,
30
+ "forced_bos_token_id": null,
31
+ "forced_eos_token_id": null,
32
+ "hidden_act": "quick_gelu",
33
+ "hidden_size": 768,
34
+ "id2label": {
35
+ "0": "LABEL_0",
36
+ "1": "LABEL_1"
37
+ },
38
+ "initializer_factor": 1.0,
39
+ "initializer_range": 0.02,
40
+ "intermediate_size": 3072,
41
+ "is_decoder": false,
42
+ "is_encoder_decoder": false,
43
+ "label2id": {
44
+ "LABEL_0": 0,
45
+ "LABEL_1": 1
46
+ },
47
+ "layer_norm_eps": 1e-05,
48
+ "length_penalty": 1.0,
49
+ "max_length": 20,
50
+ "max_position_embeddings": 77,
51
+ "min_length": 0,
52
+ "model_type": "clip_text_model",
53
+ "no_repeat_ngram_size": 0,
54
+ "num_attention_heads": 12,
55
+ "num_beam_groups": 1,
56
+ "num_beams": 1,
57
+ "num_hidden_layers": 12,
58
+ "num_return_sequences": 1,
59
+ "output_attentions": false,
60
+ "output_hidden_states": false,
61
+ "output_scores": false,
62
+ "pad_token_id": 1,
63
+ "prefix": null,
64
+ "problem_type": null,
65
+ "projection_dim": 512,
66
+ "pruned_heads": {},
67
+ "remove_invalid_values": false,
68
+ "repetition_penalty": 1.0,
69
+ "return_dict": true,
70
+ "return_dict_in_generate": false,
71
+ "sep_token_id": null,
72
+ "suppress_tokens": null,
73
+ "task_specific_params": null,
74
+ "temperature": 1.0,
75
+ "tf_legacy_loss": false,
76
+ "tie_encoder_decoder": false,
77
+ "tie_word_embeddings": true,
78
+ "tokenizer_class": null,
79
+ "top_k": 50,
80
+ "top_p": 1.0,
81
+ "torch_dtype": null,
82
+ "torchscript": false,
83
+ "transformers_version": "4.30.2",
84
+ "typical_p": 1.0,
85
+ "use_bfloat16": false,
86
+ "vocab_size": 49408
87
+ },
88
+ "torch_dtype": "float32",
89
+ "transformers_version": null,
90
+ "vision_config": {
91
+ "_name_or_path": "",
92
+ "add_cross_attention": false,
93
+ "architectures": null,
94
+ "attention_dropout": 0.0,
95
+ "bad_words_ids": null,
96
+ "begin_suppress_tokens": null,
97
+ "bos_token_id": null,
98
+ "chunk_size_feed_forward": 0,
99
+ "cross_attention_hidden_size": null,
100
+ "decoder_start_token_id": null,
101
+ "diversity_penalty": 0.0,
102
+ "do_sample": false,
103
+ "dropout": 0.0,
104
+ "early_stopping": false,
105
+ "encoder_no_repeat_ngram_size": 0,
106
+ "eos_token_id": null,
107
+ "exponential_decay_length_penalty": null,
108
+ "finetuning_task": null,
109
+ "forced_bos_token_id": null,
110
+ "forced_eos_token_id": null,
111
+ "hidden_act": "quick_gelu",
112
+ "hidden_size": 1024,
113
+ "id2label": {
114
+ "0": "LABEL_0",
115
+ "1": "LABEL_1"
116
+ },
117
+ "image_size": 224,
118
+ "initializer_factor": 1.0,
119
+ "initializer_range": 0.02,
120
+ "intermediate_size": 4096,
121
+ "is_decoder": false,
122
+ "is_encoder_decoder": false,
123
+ "label2id": {
124
+ "LABEL_0": 0,
125
+ "LABEL_1": 1
126
+ },
127
+ "layer_norm_eps": 1e-05,
128
+ "length_penalty": 1.0,
129
+ "max_length": 20,
130
+ "min_length": 0,
131
+ "model_type": "clip_vision_model",
132
+ "no_repeat_ngram_size": 0,
133
+ "num_attention_heads": 16,
134
+ "num_beam_groups": 1,
135
+ "num_beams": 1,
136
+ "num_channels": 3,
137
+ "num_hidden_layers": 24,
138
+ "num_return_sequences": 1,
139
+ "output_attentions": false,
140
+ "output_hidden_states": false,
141
+ "output_scores": false,
142
+ "pad_token_id": null,
143
+ "patch_size": 14,
144
+ "prefix": null,
145
+ "problem_type": null,
146
+ "projection_dim": 512,
147
+ "pruned_heads": {},
148
+ "remove_invalid_values": false,
149
+ "repetition_penalty": 1.0,
150
+ "return_dict": true,
151
+ "return_dict_in_generate": false,
152
+ "sep_token_id": null,
153
+ "suppress_tokens": null,
154
+ "task_specific_params": null,
155
+ "temperature": 1.0,
156
+ "tf_legacy_loss": false,
157
+ "tie_encoder_decoder": false,
158
+ "tie_word_embeddings": true,
159
+ "tokenizer_class": null,
160
+ "top_k": 50,
161
+ "top_p": 1.0,
162
+ "torch_dtype": null,
163
+ "torchscript": false,
164
+ "transformers_version": "4.30.2",
165
+ "typical_p": 1.0,
166
+ "use_bfloat16": false
167
+ }
168
+ }
safety_checker/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16d28f2b37109f222cdc33620fdd262102ac32112be0352a7f77e9614b35a394
3
+ size 1216064769
text_encoder/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "stabilityai/stable-diffusion-2-depth",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
@@ -7,18 +7,18 @@
7
  "bos_token_id": 0,
8
  "dropout": 0.0,
9
  "eos_token_id": 2,
10
- "hidden_act": "gelu",
11
- "hidden_size": 1024,
12
  "initializer_factor": 1.0,
13
  "initializer_range": 0.02,
14
- "intermediate_size": 4096,
15
  "layer_norm_eps": 1e-05,
16
  "max_position_embeddings": 77,
17
  "model_type": "clip_text_model",
18
- "num_attention_heads": 16,
19
- "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
- "projection_dim": 512,
22
  "torch_dtype": "float32",
23
  "transformers_version": "4.30.2",
24
  "vocab_size": 49409
 
1
  {
2
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
 
7
  "bos_token_id": 0,
8
  "dropout": 0.0,
9
  "eos_token_id": 2,
10
+ "hidden_act": "quick_gelu",
11
+ "hidden_size": 768,
12
  "initializer_factor": 1.0,
13
  "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
  "layer_norm_eps": 1e-05,
16
  "max_position_embeddings": 77,
17
  "model_type": "clip_text_model",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
  "pad_token_id": 1,
21
+ "projection_dim": 768,
22
  "torch_dtype": "float32",
23
  "transformers_version": "4.30.2",
24
  "vocab_size": 49409
text_encoder/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c0b6afab6fdb9ecef989a674eb2d4a23f31ca6115c0583d1b6b1ec3e8af53ee
3
- size 1361684001
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17f5de19a430ba6a420445ac5fd5c9a59804da12f68bfaff3a6aa7a6056e9bdb
3
+ size 492312865
tokenizer/special_tokens_map.json CHANGED
@@ -13,7 +13,7 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": "!",
17
  "unk_token": {
18
  "content": "<|endoftext|>",
19
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "<|endoftext|>",
17
  "unk_token": {
18
  "content": "<|endoftext|>",
19
  "lstrip": false,
unet/config.json CHANGED
@@ -1,17 +1,12 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.1",
4
- "_name_or_path": "stabilityai/stable-diffusion-2-depth",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
  "addition_time_embed_dim": null,
9
- "attention_head_dim": [
10
- 5,
11
- 10,
12
- 20,
13
- 20
14
- ],
15
  "block_out_channels": [
16
  320,
17
  640,
@@ -23,7 +18,7 @@
23
  "class_embeddings_concat": false,
24
  "conv_in_kernel": 3,
25
  "conv_out_kernel": 3,
26
- "cross_attention_dim": 1024,
27
  "cross_attention_norm": null,
28
  "down_block_types": [
29
  "CrossAttnDownBlock2D",
@@ -37,7 +32,7 @@
37
  "encoder_hid_dim_type": null,
38
  "flip_sin_to_cos": true,
39
  "freq_shift": 0,
40
- "in_channels": 5,
41
  "layers_per_block": 2,
42
  "mid_block_only_cross_attention": null,
43
  "mid_block_scale_factor": 1,
@@ -52,7 +47,7 @@
52
  "resnet_out_scale_factor": 1.0,
53
  "resnet_skip_time_act": false,
54
  "resnet_time_scale_shift": "default",
55
- "sample_size": 32,
56
  "time_cond_proj_dim": null,
57
  "time_embedding_act_fn": null,
58
  "time_embedding_dim": null,
@@ -66,5 +61,5 @@
66
  "CrossAttnUpBlock2D"
67
  ],
68
  "upcast_attention": false,
69
- "use_linear_projection": true
70
  }
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.1",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
  "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
 
 
 
 
 
10
  "block_out_channels": [
11
  320,
12
  640,
 
18
  "class_embeddings_concat": false,
19
  "conv_in_kernel": 3,
20
  "conv_out_kernel": 3,
21
+ "cross_attention_dim": 768,
22
  "cross_attention_norm": null,
23
  "down_block_types": [
24
  "CrossAttnDownBlock2D",
 
32
  "encoder_hid_dim_type": null,
33
  "flip_sin_to_cos": true,
34
  "freq_shift": 0,
35
+ "in_channels": 4,
36
  "layers_per_block": 2,
37
  "mid_block_only_cross_attention": null,
38
  "mid_block_scale_factor": 1,
 
47
  "resnet_out_scale_factor": 1.0,
48
  "resnet_skip_time_act": false,
49
  "resnet_time_scale_shift": "default",
50
+ "sample_size": 64,
51
  "time_cond_proj_dim": null,
52
  "time_embedding_act_fn": null,
53
  "time_embedding_dim": null,
 
61
  "CrossAttnUpBlock2D"
62
  ],
63
  "upcast_attention": false,
64
+ "use_linear_projection": false
65
  }
unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87e1d440b0aca6f6e4590d30495a59c920fdb40419f5c9bf82dcd47b5bf21016
3
- size 3463946213
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39aeb5f57e936fdb52331f49d69299fb130a5456c269b67c08699b109e8485fd
3
+ size 3438375973
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.18.1",
4
- "_name_or_path": "stabilityai/stable-diffusion-2-depth",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
@@ -20,7 +20,7 @@
20
  "layers_per_block": 2,
21
  "norm_num_groups": 32,
22
  "out_channels": 3,
23
- "sample_size": 256,
24
  "scaling_factor": 0.18215,
25
  "up_block_types": [
26
  "UpDecoderBlock2D",
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.18.1",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
20
  "layers_per_block": 2,
21
  "norm_num_groups": 32,
22
  "out_channels": 3,
23
+ "sample_size": 512,
24
  "scaling_factor": 0.18215,
25
  "up_block_types": [
26
  "UpDecoderBlock2D",
vae/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:185b0c03485b4048bb6158de087df301b79ea187844c76ae91cd4cda207282a2
3
  size 334715569
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11a6fc35e77a2d5696ae6a494f797f01b7ab97b08b5f8f2f17e19d0ef169b1ca
3
  size 334715569