umaru97 commited on
Commit
6ad2cd7
·
1 Parent(s): 7211af5

End of training

Browse files
README.md ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ license: creativeml-openrail-m
4
+ base_model: runwayml/stable-diffusion-v1-5
5
+ tags:
6
+ - stable-diffusion
7
+ - stable-diffusion-diffusers
8
+ - text-to-image
9
+ - diffusers
10
+ - lora
11
+ inference: true
12
+ ---
13
+
14
+ # LoRA text2image fine-tuning - umaru97/flickr30k-lora
15
+ These are LoRA adaption weights for runwayml/stable-diffusion-v1-5. The weights were fine-tuned on the umaru97/flickr30k_train_val_test dataset. You can find some example images in the following.
16
+
17
+ ![img_0](./image_0.png)
18
+ ![img_1](./image_1.png)
19
+ ![img_2](./image_2.png)
20
+ ![img_3](./image_3.png)
21
+
checkpoint-2000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31422443d598b2b008dbf08ff0817a33753798a2b868a8ab924557a5190c0c0a
3
+ size 6591685
checkpoint-2000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1af87a5b5db554b2572ecec3e9c43ebc4ca4ed449de840bc2aadccb54e5dad1
3
+ size 3285965
checkpoint-2000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e1d9ed29fe4a374a20496c1815e5f5541e9ebeb4c1c161ad47309059cd09ce
3
+ size 14663
checkpoint-2000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd2de9749828adacdf103bf6e9592702bb7067a2c1df27dd62ab38c1eb8c070f
3
+ size 557
checkpoint-2000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfb08ff088790178fb856390b7fafbc19d29b343d2e466e0883e97f75aaa2b6b
3
+ size 563
image_0.png ADDED
image_1.png ADDED
image_2.png ADDED
image_3.png ADDED
logs/text2image-fine-tune/1691132013.450615/events.out.tfevents.1691132013.b4ff7e718147.19907.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48ab5154d65abfe1a969e56c1a88b7f25396a3cf659231b7995d203f1550bf0
3
+ size 2333
logs/text2image-fine-tune/1691132013.4635336/hparams.yml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: caption
8
+ center_crop: true
9
+ checkpointing_steps: 2000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: umaru97/flickr30k_train_val_test
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: false
17
+ hub_model_id: flickr30k-lora
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 0.0001
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: cosine
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 1813
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 1
31
+ num_validation_images: 4
32
+ output_dir: /content/drive/My Drive/interview/sembcorp/takehome_assignment/task3/models
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
35
+ push_to_hub: true
36
+ random_flip: true
37
+ rank: 4
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 77
44
+ snr_gamma: null
45
+ train_batch_size: 4
46
+ train_data_dir: null
47
+ use_8bit_adam: false
48
+ validation_epochs: 1
49
+ validation_prompt: Cat
logs/text2image-fine-tune/1691132105.9168317/events.out.tfevents.1691132105.b4ff7e718147.20384.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3e98b37a9b0897b1c4dbc5c13cee73f78f4d5ac44a7d689a4ba0c8254d84f83
3
+ size 2333
logs/text2image-fine-tune/1691132105.9292111/hparams.yml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: caption
8
+ center_crop: true
9
+ checkpointing_steps: 2000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: umaru97/flickr30k_train_val_test
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: false
17
+ hub_model_id: flickr30k-lora
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 0.0001
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: cosine
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 3626
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 2
31
+ num_validation_images: 4
32
+ output_dir: /content/drive/My Drive/interview/sembcorp/takehome_assignment/task3/models
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
35
+ push_to_hub: true
36
+ random_flip: true
37
+ rank: 4
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 77
44
+ snr_gamma: null
45
+ train_batch_size: 4
46
+ train_data_dir: null
47
+ use_8bit_adam: false
48
+ validation_epochs: 1
49
+ validation_prompt: Cat
logs/text2image-fine-tune/events.out.tfevents.1691132013.b4ff7e718147.19907.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e54542caafd3b4d17c5dedd94fa17f58c476916c11f244f0c207e6e4bef334
3
+ size 616
logs/text2image-fine-tune/events.out.tfevents.1691132105.b4ff7e718147.20384.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fe2bee1e1a7b1676d494a2d71e3cd6c7593a5b9b11c53663c6550bdda1596ad
3
+ size 4148192
pytorch_lora_weights.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a17d470526debf403bba6a8e2ece1032352af2df8a90068c061d6bfb88eb473
3
+ size 3287771