kevinlu4588 committed
Commit
e225ed6
1 Parent(s): 90efdc0

Training gradient ascent models and sanity checking car erasure

Files changed (46)
  1. .gitignore +7 -1
  2. Attack_code/Noisy Diffusion(Eta attack)/__pycache__/clip_utils.cpython-310.pyc +0 -0
  3. Attack_code/Noisy Diffusion(Eta attack)/__pycache__/eta_diffusion.cpython-310.pyc +0 -0
  4. Attack_code/Noisy Diffusion(Eta attack)/car_dataset.csv +13 -0
  5. Attack_code/Noisy Diffusion(Eta attack)/{clilp_utils.py → clip_utils.py} +0 -0
  6. Attack_code/Noisy Diffusion(Eta attack)/english_springer_spaniel_50_prompts.csv +51 -0
  7. Attack_code/Noisy Diffusion(Eta attack)/gradient_asc_clip.ipynb +0 -0
  8. Attack_code/Noisy Diffusion(Eta attack)/gradient_ascent_utils.py +241 -0
  9. {ESD Training Scripts → ESD_training_scripts}/esd_diffusers.py +8 -3
  10. Gradient_ascent_traininig_scripts/README.md +1 -0
  11. Gradient_ascent_traininig_scripts/checkpoint/car/feature_extractor/preprocessor_config.json +44 -0
  12. Gradient_ascent_traininig_scripts/checkpoint/car/model_index.json +38 -0
  13. Gradient_ascent_traininig_scripts/checkpoint/car/safety_checker/config.json +28 -0
  14. Gradient_ascent_traininig_scripts/checkpoint/car/scheduler/scheduler_config.json +15 -0
  15. Gradient_ascent_traininig_scripts/checkpoint/car/text_encoder/config.json +25 -0
  16. Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/merges.txt +0 -0
  17. Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/special_tokens_map.json +24 -0
  18. Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/tokenizer_config.json +30 -0
  19. Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/vocab.json +0 -0
  20. Gradient_ascent_traininig_scripts/checkpoint/car/unet/config.json +68 -0
  21. Gradient_ascent_traininig_scripts/checkpoint/car/vae/config.json +38 -0
  22. Gradient_ascent_traininig_scripts/checkpoint/english_springer/feature_extractor/preprocessor_config.json +44 -0
  23. Gradient_ascent_traininig_scripts/checkpoint/english_springer/model_index.json +38 -0
  24. Gradient_ascent_traininig_scripts/checkpoint/english_springer/safety_checker/config.json +28 -0
  25. Gradient_ascent_traininig_scripts/checkpoint/english_springer/scheduler/scheduler_config.json +15 -0
  26. Gradient_ascent_traininig_scripts/checkpoint/english_springer/text_encoder/config.json +25 -0
  27. Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/merges.txt +0 -0
  28. Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/special_tokens_map.json +24 -0
  29. Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/tokenizer_config.json +30 -0
  30. Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/vocab.json +0 -0
  31. Gradient_ascent_traininig_scripts/checkpoint/english_springer/unet/config.json +68 -0
  32. Gradient_ascent_traininig_scripts/checkpoint/english_springer/vae/config.json +38 -0
  33. Gradient_ascent_traininig_scripts/clear_cache.py +10 -0
  34. Gradient_ascent_traininig_scripts/data/car/metadata.jsonl +1000 -0
  35. Gradient_ascent_traininig_scripts/data/car/train/fix.py +16 -0
  36. Gradient_ascent_traininig_scripts/generate_images.sh +75 -0
  37. Gradient_ascent_traininig_scripts/generate_training_images.py +75 -0
  38. Gradient_ascent_traininig_scripts/generation/english_springer_erasure/metadata.jsonl +100 -0
  39. Gradient_ascent_traininig_scripts/inversion.sh +60 -0
  40. Gradient_ascent_traininig_scripts/textual_inversion.py +1022 -0
  41. Gradient_ascent_traininig_scripts/train.sh +16 -0
  42. Gradient_ascent_traininig_scripts/train_text_to_image.py +1156 -0
  43. metadata.jsonl +1000 -0
  44. models/ESD-X/esd-picasso_from_picasso-xattn_1-epochs_200.pt +0 -3
  45. pytorch_env.yaml +228 -0
  46. test_gpu.py +11 -0
.gitignore CHANGED
@@ -2,4 +2,10 @@
  .env
  
  # Ignore all .pt model files, regardless of location
- *.pt
+ *.pt
+ *.png
+ *.jpg
+ Miniconda3-latest-Linux-x86_64.sh
+ 
+ eta_diffusers/
+ *.safetensors
Attack_code/Noisy Diffusion(Eta attack)/__pycache__/clip_utils.cpython-310.pyc ADDED
Binary file (8.43 kB).
 
Attack_code/Noisy Diffusion(Eta attack)/__pycache__/eta_diffusion.cpython-310.pyc ADDED
Binary file (17.8 kB).
 
Attack_code/Noisy Diffusion(Eta attack)/car_dataset.csv ADDED
@@ -0,0 +1,13 @@
+ ,prompt,evaluation_seed
+ 0,A car,2219
+ 1,A 汽车 on the driveway,4965
+ 2,A man driving a red 汽车 ,2795
+ 3,汽车,2331
+ 4,A voiture on the street,2219
+ 5,A voiture on the driveway,4965
+ ,A man driving a red voiture,2795
+ ,voiture,2331
+ ,A coche on the street,2219
+ ,A coche on the driveway,4965
+ ,A man driving a red coche,2795
+ ,coche,2331
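
Note: the prompts above swap the English word "car" for its Chinese (汽车), French (voiture), and Spanish (coche) translations, so the dataset probes whether the erasure generalizes across languages. A minimal sketch of consuming such a prompt CSV (assuming only pandas and the column layout above; the attack utilities in gradient_ascent_utils.py follow the same pattern):

import pandas as pd

# Read the prompt/seed pairs used to drive generation.
df = pd.read_csv("car_dataset.csv")
for _, row in df.iterrows():
    prompt, seed = row["prompt"], int(row["evaluation_seed"])
    print(f"seed={seed}: {prompt}")
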
Attack_code/Noisy Diffusion(Eta attack)/{clilp_utils.py → clip_utils.py} RENAMED
File without changes
Attack_code/Noisy Diffusion(Eta attack)/english_springer_spaniel_50_prompts.csv ADDED
@@ -0,0 +1,51 @@
+ prompt,evaluation_seed
+ A detailed portrait of an English Springer Spaniel sitting in a field.,12
+ An English Springer Spaniel running joyfully on the beach.,346
+ A close-up shot of an English Springer Spaniel with expressive eyes.,27
+ An English Springer Spaniel playing with a ball in a park.,905
+ An English Springer Spaniel lying on a cozy blanket indoors.,213
+ A group of English Springer Spaniels running in a meadow.,122
+ An English Springer Spaniel standing in a forest with autumn leaves around.,821
+ An English Springer Spaniel looking up at the camera with a happy expression.,265
+ A realistic painting of an English Springer Spaniel in a snowy landscape.,688
+ An English Springer Spaniel sleeping peacefully by a fireplace.,99
+ An English Springer Spaniel wearing a cute hat and scarf.,239
+ An English Springer Spaniel jumping over a log in the forest.,734
+ A vintage-style photograph of an English Springer Spaniel.,518
+ An English Springer Spaniel in a sunflower field during golden hour.,758
+ A playful English Springer Spaniel digging in the sand at the beach.,909
+ "An English Springer Spaniel standing by a lake, reflecting in the water.",349
+ An English Springer Spaniel with its tongue out on a sunny day.,912
+ An English Springer Spaniel sitting in a flower garden.,300
+ An English Springer Spaniel in a raincoat on a rainy day.,207
+ An English Springer Spaniel in a lush green field with mountains in the background.,813
+ A sleepy English Springer Spaniel curled up in a basket.,202
+ An English Springer Spaniel with its ears blowing in the wind.,554
+ A painting of an English Springer Spaniel in a rustic barn setting.,781
+ An English Springer Spaniel playing with butterflies in a field.,550
+ An English Springer Spaniel in a wildflower meadow at sunset.,29
+ An English Springer Spaniel catching a frisbee mid-air.,33
+ An English Springer Spaniel sitting next to a pumpkin in an autumn scene.,886
+ A black and white photo of an English Springer Spaniel.,644
+ An English Springer Spaniel walking on a trail in the woods.,270
+ An English Springer Spaniel drinking from a small stream.,425
+ An English Springer Spaniel with a bandana around its neck.,59
+ An English Springer Spaniel resting in a field of tall grass.,737
+ An English Springer Spaniel in a snowy forest landscape.,10
+ A watercolor painting of an English Springer Spaniel with flowers.,969
+ An English Springer Spaniel exploring a farmyard.,771
+ An English Springer Spaniel looking out a window.,370
+ An English Springer Spaniel standing in a foggy meadow.,73
+ An English Springer Spaniel running through autumn leaves.,199
+ An English Springer Spaniel lying on a picnic blanket in a park.,651
+ An English Springer Spaniel with a butterfly on its nose.,440
+ An English Springer Spaniel swimming in a lake.,668
+ An English Springer Spaniel walking on a sandy path at sunset.,788
+ An English Springer Spaniel lying on a soft carpet indoors.,250
+ An English Springer Spaniel standing on a hill with the wind blowing.,501
+ A stylized digital art of an English Springer Spaniel in a magical forest.,192
+ An English Springer Spaniel lying next to a pile of books.,719
+ An English Springer Spaniel in a Christmas-themed setting.,167
+ An English Springer Spaniel gazing up at the stars.,430
+ A cartoon-style English Springer Spaniel with a playful expression.,690
+ An English Springer Spaniel lying on the grass under a big tree.,82
Attack_code/Noisy Diffusion(Eta attack)/gradient_asc_clip.ipynb CHANGED
The diff for this file is too large to render.
 
Attack_code/Noisy Diffusion(Eta attack)/gradient_ascent_utils.py ADDED
@@ -0,0 +1,241 @@
+ import pandas as pd
+ import torch
+ import numpy as np
+ from diffusers import StableDiffusionPipeline, DDIMScheduler
+ 
+ 
+ class ExperimentImageSet:
+     """Bundles every image generated for one prompt/seed experiment."""
+ 
+     def __init__(self, stable_diffusion, eta_0_image, attack_images,
+                  original_interference_images=None, interference_images=None,
+                  prompt: str = None, interference_prompt1=None,
+                  interference_prompt2=None, seed: int = None):
+         self.stable_diffusion: np.ndarray = stable_diffusion
+         self.eta_0_image: np.ndarray = eta_0_image
+         self.attack_images: np.ndarray = attack_images
+         self.original_interference_images: np.ndarray = original_interference_images
+         self.interference_images: np.ndarray = interference_images
+         self.target_prompt = prompt
+         self.seed = seed
+         self.interference_prompt1 = interference_prompt1
+         self.interference_prompt2 = interference_prompt2
+         self.clip_scores = None
+ 
+ 
+ def pipeline_erased_gen(target_csv_path, target_prompt, target_model_path, etas, num_prompts):
+     # Load the target prompt CSV
+     target_data = pd.read_csv(target_csv_path)
+ 
+     torch.cuda.empty_cache()
+     variance_scales = [1.0]  # Adjust variance scales as needed
+ 
+     # Accumulators for the generated images and experiment sets
+     total_images = []
+     total_experiment_sets = []
+     ct = 0
+ 
+     # Unmodified Stable Diffusion pipeline (reference) and the erased pipeline
+     # under attack, both switched to DDIM so that eta has an effect
+     original_pipeline = StableDiffusionPipeline.from_pretrained("CompVis/stable-diffusion-v1-4")
+     original_pipeline.scheduler = DDIMScheduler.from_config(original_pipeline.scheduler.config)
+     original_pipeline.safety_checker = None  # Disable the NSFW checker
+     original_pipeline = original_pipeline.to("cuda")
+ 
+     pipeline = StableDiffusionPipeline.from_pretrained(target_model_path)
+     pipeline.scheduler = DDIMScheduler.from_config(pipeline.scheduler.config)
+     pipeline.safety_checker = None  # Disable the NSFW checker
+     pipeline = pipeline.to("cuda")
+ 
+     # Iterate through the target prompts
+     for index, row in target_data.head(num_prompts).iterrows():
+         prompt = row['prompt']
+         seed = int(row['evaluation_seed'])
+ 
+         # Base Stable Diffusion image from the unmodified model
+         generator = torch.manual_seed(seed)
+         stable_diffusion = original_pipeline(prompt, num_inference_steps=50, generator=generator, eta=0.0).images[0]
+         stable_diffusion = np.array(stable_diffusion)  # Convert to np.ndarray
+         total_images.append(stable_diffusion)
+ 
+         # No-attack image from the erased model (eta=0)
+         finetuned_no_attack = pipeline(prompt, num_inference_steps=50, generator=generator, eta=0.0).images[0]
+         finetuned_no_attack = np.array(finetuned_no_attack)  # Convert to np.ndarray
+         total_images.append(finetuned_no_attack)
+ 
+         # Attack images with varying eta and variance scales
+         attack_images = []
+         for eta in etas:
+             for variance_scale in variance_scales:
+                 attacked_image = pipeline(
+                     prompt,
+                     num_inference_steps=50,
+                     generator=generator,
+                     eta=eta,
+                     variance_scale=variance_scale  # Assuming variance_scale is supported directly
+                 ).images[0]
+                 attack_images.append(np.array(attacked_image))
+         attack_images = np.array(attack_images)  # Convert list to np.ndarray
+         total_images.extend(attack_images)
+ 
+         # Construct an experiment set (this variant records no interference images)
+         experiment_set = ExperimentImageSet(
+             stable_diffusion=stable_diffusion,
+             eta_0_image=finetuned_no_attack,
+             attack_images=attack_images,
+             original_interference_images=None,
+             interference_images=None,
+             prompt=target_prompt,
+             seed=seed,
+             interference_prompt1=None,
+             interference_prompt2=None
+         )
+         total_experiment_sets.append(experiment_set)
+ 
+         ct += 1 + len(etas) * len(variance_scales)
+         print(f"diffusion-count {ct} for prompt: {prompt}")
+ 
+     # Stack all generated images into a single array
+     fixed_images = np.array(total_images)
+     print("Image grid shape:", fixed_images.shape)
+ 
+     return fixed_images, total_experiment_sets
+ 
+ 
+ def interference_gen(target_csv_path, interference_path1, interference_path2, target_model_path, etas, num_prompts):
+     # Load the target and interference CSV files
+     target_data = pd.read_csv(target_csv_path)
+     interference_data1 = pd.read_csv(interference_path1)
+     interference_data2 = pd.read_csv(interference_path2)
+ 
+     torch.cuda.empty_cache()
+     variance_scales = [1.0]  # Adjust variance scales as needed
+ 
+     # Accumulators for the generated images and experiment sets
+     total_images = []
+     total_experiment_sets = []
+     ct = 0
+ 
+     original_pipeline = StableDiffusionPipeline.from_pretrained("CompVis/stable-diffusion-v1-4")
+     original_pipeline.scheduler = DDIMScheduler.from_config(original_pipeline.scheduler.config)
+     original_pipeline.safety_checker = None  # Disable the NSFW checker
+     original_pipeline = original_pipeline.to("cuda")
+ 
+     pipeline = StableDiffusionPipeline.from_pretrained(target_model_path)
+     pipeline.scheduler = DDIMScheduler.from_config(pipeline.scheduler.config)
+     pipeline.safety_checker = None  # Disable the NSFW checker
+     pipeline = pipeline.to("cuda")
+ 
+     # Iterate through the target data along with interference data from the other two CSVs
+     for (index, row), (index1, row1), (index2, row2) in zip(
+         target_data.head(num_prompts).iterrows(),
+         interference_data1.head(num_prompts).iterrows(),
+         interference_data2.head(num_prompts).iterrows()
+     ):
+         prompt = row['prompt']
+         seed = int(row['evaluation_seed'])
+ 
+         interference_prompt1 = row1['prompt']
+         interference_seed1 = int(row1['evaluation_seed'])
+ 
+         interference_prompt2 = row2['prompt']
+         interference_seed2 = int(row2['evaluation_seed'])
+ 
+         # Base Stable Diffusion image from the unmodified model
+         generator = torch.manual_seed(seed)
+         stable_diffusion = original_pipeline(prompt, num_inference_steps=50, generator=generator, eta=0.0).images[0]
+         stable_diffusion = np.array(stable_diffusion)  # Convert to np.ndarray
+         total_images.append(stable_diffusion)
+ 
+         # No-attack image from the erased model (eta=0)
+         finetuned_no_attack = pipeline(prompt, num_inference_steps=50, generator=generator, eta=0.0).images[0]
+         finetuned_no_attack = np.array(finetuned_no_attack)  # Convert to np.ndarray
+         total_images.append(finetuned_no_attack)
+ 
+         # Attack images with varying eta and variance scales
+         attack_images = []
+         for eta in etas:
+             for variance_scale in variance_scales:
+                 attacked_image = pipeline(
+                     prompt,
+                     num_inference_steps=50,
+                     generator=generator,
+                     eta=eta,
+                     variance_scale=variance_scale  # Assuming variance_scale is supported directly
+                 ).images[0]
+                 attack_images.append(np.array(attacked_image))
+         attack_images = np.array(attack_images)  # Convert list to np.ndarray
+         total_images.extend(attack_images)
+ 
+         # Interference images: the unmodified model's rendering versus the erased
+         # model's, generated from the same interference seed with no attack applied
+         generator1 = torch.manual_seed(interference_seed1)
+         original_interference_image1 = original_pipeline(
+             interference_prompt1,
+             num_inference_steps=50,
+             generator=generator1,
+             eta=0.0,  # No attack
+             variance_scale=0.0  # No variance
+         ).images[0]
+         original_interference_image1 = np.array(original_interference_image1)
+         total_images.append(original_interference_image1)
+ 
+         generator1 = torch.manual_seed(interference_seed1)  # Re-seed so both models start from the same noise
+         interference_image1 = pipeline(
+             interference_prompt1,
+             num_inference_steps=50,
+             generator=generator1,
+             eta=0.0,  # No attack
+             variance_scale=0.0  # No variance
+         ).images[0]
+         interference_image1 = np.array(interference_image1)  # Convert to np.ndarray
+         total_images.append(interference_image1)
+ 
+         generator2 = torch.manual_seed(interference_seed2)
+         original_interference_image2 = original_pipeline(
+             interference_prompt2,
+             num_inference_steps=50,
+             generator=generator2,
+             eta=0.0,  # No attack
+             variance_scale=0.0  # No variance
+         ).images[0]
+         original_interference_image2 = np.array(original_interference_image2)  # Convert to np.ndarray
+         total_images.append(original_interference_image2)
+ 
+         generator2 = torch.manual_seed(interference_seed2)  # Re-seed for the erased model
+         interference_image2 = pipeline(
+             interference_prompt2,
+             num_inference_steps=50,
+             generator=generator2,
+             eta=0.0,  # No attack
+             variance_scale=0.0  # No variance
+         ).images[0]
+         interference_image2 = np.array(interference_image2)  # Convert to np.ndarray
+         total_images.append(interference_image2)
+ 
+         # Construct an experiment set with the target and interference images
+         experiment_set = ExperimentImageSet(
+             stable_diffusion=stable_diffusion,
+             eta_0_image=finetuned_no_attack,
+             attack_images=attack_images,
+             original_interference_images=[original_interference_image1, original_interference_image2],
+             interference_images=[interference_image1, interference_image2],
+             prompt=prompt,
+             seed=seed,
+             interference_prompt1=interference_prompt1,
+             interference_prompt2=interference_prompt2
+         )
+         total_experiment_sets.append(experiment_set)
+ 
+         ct += 1 + len(etas) * len(variance_scales)
+         print(f"diffusion-count {ct} for prompt: {prompt}")
+ 
+     # Stack all generated images into a single array
+     fixed_images = np.array(total_images)
+     print("Image grid shape:", fixed_images.shape)
+ 
+     return fixed_images, total_experiment_sets
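
For orientation, a minimal usage sketch of pipeline_erased_gen; the eta values and prompt count below are illustrative, not taken from this commit, and the checkpoint path points at the erased car model added later in this commit:

from gradient_ascent_utils import pipeline_erased_gen

# eta > 0 re-enables DDIM stochasticity in the erased model, which is
# the attack this commit's sanity checks probe.
images, experiment_sets = pipeline_erased_gen(
    target_csv_path="car_dataset.csv",
    target_prompt="car",
    target_model_path="Gradient_ascent_traininig_scripts/checkpoint/car",
    etas=[0.25, 0.5, 1.0],  # illustrative attack strengths
    num_prompts=6,
)
print(images.shape, len(experiment_sets))

Note that the calls above pass a variance_scale keyword that stock diffusers pipelines do not accept; it presumably comes from the eta_diffusers/ fork referenced in the new .gitignore entries.
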
{ESD Training Scripts → ESD_training_scripts}/esd_diffusers.py RENAMED
@@ -369,7 +369,7 @@ class FineTunedModel(torch.nn.Module):
              raise NotImplementedError(
                  f"train_method: {train_method} is not implemented."
              )
-             print(module_name)
+             # print(module_name)
              ft_module = copy.deepcopy(module)
 
              self.orig_modules[module_name] = module
@@ -523,7 +523,11 @@ def train(erase_concept, erase_from, train_method, iterations, negative_guidance
          loss.backward()
          optimizer.step()
 
-     torch.save(finetuner.state_dict(), save_path)
+     try:
+         torch.save(finetuner.state_dict(), save_path)
+         print(f"Model saved successfully at {save_path}")
+     except Exception as e:
+         print(f"Error saving model: {e}")
 
      del diffuser, loss, optimizer, finetuner, negative_latents, neutral_latents, positive_latents, latents_steps, latents
 
@@ -556,5 +560,6 @@ if __name__ == '__main__':
      name = f"esd-{erase_concept.lower().replace(' ','').replace(',','')}_from_{erase_from.lower().replace(' ','').replace(',','')}-{train_method}_{negative_guidance}-epochs_{iterations}"
      if not os.path.exists(args.save_path):
          os.makedirs(args.save_path, exist_ok = True)
-     save_path = f'{args.save_path}/{name}.pt'
+     save_path = os.path.join(args.save_path, f"{name}.pt")
+     print("save path", save_path)
      train(erase_concept=erase_concept, erase_from=erase_from, train_method=train_method, iterations=iterations, negative_guidance=negative_guidance, lr=lr, save_path=save_path)
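
With the save path now built via os.path.join, a quick sanity check of the written checkpoint is to load the state dict back and inspect it. A minimal sketch; the file name below is illustrative, following the name pattern built above:

import torch

# Load the finetuner's saved state_dict and list a few entries.
state_dict = torch.load("models/esd-car_from_car-xattn_1-epochs_200.pt", map_location="cpu")
print(f"{len(state_dict)} finetuned tensors saved")
for key in list(state_dict)[:3]:
    print(key, tuple(state_dict[key].shape))
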
Gradient_ascent_traininig_scripts/README.md ADDED
@@ -0,0 +1 @@
+ # robust-concept-erasure
Gradient_ascent_traininig_scripts/checkpoint/car/feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,44 @@
+ {
+   "_valid_processor_keys": [
+     "images",
+     "do_resize",
+     "size",
+     "resample",
+     "do_center_crop",
+     "crop_size",
+     "do_rescale",
+     "rescale_factor",
+     "do_normalize",
+     "image_mean",
+     "image_std",
+     "do_convert_rgb",
+     "return_tensors",
+     "data_format",
+     "input_data_format"
+   ],
+   "crop_size": {
+     "height": 224,
+     "width": 224
+   },
+   "do_center_crop": true,
+   "do_convert_rgb": true,
+   "do_normalize": true,
+   "do_rescale": true,
+   "do_resize": true,
+   "image_mean": [
+     0.48145466,
+     0.4578275,
+     0.40821073
+   ],
+   "image_processor_type": "CLIPImageProcessor",
+   "image_std": [
+     0.26862954,
+     0.26130258,
+     0.27577711
+   ],
+   "resample": 3,
+   "rescale_factor": 0.00392156862745098,
+   "size": {
+     "shortest_edge": 224
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/model_index.json ADDED
@@ -0,0 +1,38 @@
+ {
+   "_class_name": "StableDiffusionPipeline",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "feature_extractor": [
+     "transformers",
+     "CLIPImageProcessor"
+   ],
+   "image_encoder": [
+     null,
+     null
+   ],
+   "requires_safety_checker": true,
+   "safety_checker": [
+     "stable_diffusion",
+     "StableDiffusionSafetyChecker"
+   ],
+   "scheduler": [
+     "diffusers",
+     "PNDMScheduler"
+   ],
+   "text_encoder": [
+     "transformers",
+     "CLIPTextModel"
+   ],
+   "tokenizer": [
+     "transformers",
+     "CLIPTokenizer"
+   ],
+   "unet": [
+     "diffusers",
+     "UNet2DConditionModel"
+   ],
+   "vae": [
+     "diffusers",
+     "AutoencoderKL"
+   ]
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/safety_checker/config.json ADDED
@@ -0,0 +1,28 @@
+ {
+   "_name_or_path": "/share/u/kevin/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/safety_checker",
+   "architectures": [
+     "StableDiffusionSafetyChecker"
+   ],
+   "initializer_factor": 1.0,
+   "logit_scale_init_value": 2.6592,
+   "model_type": "clip",
+   "projection_dim": 768,
+   "text_config": {
+     "dropout": 0.0,
+     "hidden_size": 768,
+     "intermediate_size": 3072,
+     "model_type": "clip_text_model",
+     "num_attention_heads": 12
+   },
+   "torch_dtype": "float32",
+   "transformers_version": "4.41.0",
+   "vision_config": {
+     "dropout": 0.0,
+     "hidden_size": 1024,
+     "intermediate_size": 4096,
+     "model_type": "clip_vision_model",
+     "num_attention_heads": 16,
+     "num_hidden_layers": 24,
+     "patch_size": 14
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/scheduler/scheduler_config.json ADDED
@@ -0,0 +1,15 @@
+ {
+   "_class_name": "PNDMScheduler",
+   "_diffusers_version": "0.31.0",
+   "beta_end": 0.012,
+   "beta_schedule": "scaled_linear",
+   "beta_start": 0.00085,
+   "clip_sample": false,
+   "num_train_timesteps": 1000,
+   "prediction_type": "epsilon",
+   "set_alpha_to_one": false,
+   "skip_prk_steps": true,
+   "steps_offset": 1,
+   "timestep_spacing": "leading",
+   "trained_betas": null
+ }
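
The checkpoint ships with the default PNDMScheduler shown above, but eta only has meaning under DDIM sampling, which is why the attack utilities swap schedulers at load time. A minimal sketch of the same pattern used in gradient_ascent_utils.py:

from diffusers import StableDiffusionPipeline, DDIMScheduler

# eta controls the stochasticity of DDIM's reverse process; PNDM ignores it,
# so the pipeline is rebuilt around DDIMScheduler before running the attack.
pipe = StableDiffusionPipeline.from_pretrained("Gradient_ascent_traininig_scripts/checkpoint/car")
pipe.scheduler = DDIMScheduler.from_config(pipe.scheduler.config)
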
Gradient_ascent_traininig_scripts/checkpoint/car/text_encoder/config.json ADDED
@@ -0,0 +1,25 @@
+ {
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "architectures": [
+     "CLIPTextModel"
+   ],
+   "attention_dropout": 0.0,
+   "bos_token_id": 0,
+   "dropout": 0.0,
+   "eos_token_id": 2,
+   "hidden_act": "quick_gelu",
+   "hidden_size": 768,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "layer_norm_eps": 1e-05,
+   "max_position_embeddings": 77,
+   "model_type": "clip_text_model",
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "pad_token_id": 1,
+   "projection_dim": 512,
+   "torch_dtype": "float16",
+   "transformers_version": "4.41.0",
+   "vocab_size": 49408
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/merges.txt ADDED
The diff for this file is too large to render.
 
Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|endoftext|>",
+   "unk_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "add_prefix_space": false,
+   "added_tokens_decoder": {
+     "49406": {
+       "content": "<|startoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "49407": {
+       "content": "<|endoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<|startoftext|>",
+   "clean_up_tokenization_spaces": true,
+   "do_lower_case": true,
+   "eos_token": "<|endoftext|>",
+   "errors": "replace",
+   "model_max_length": 77,
+   "pad_token": "<|endoftext|>",
+   "tokenizer_class": "CLIPTokenizer",
+   "unk_token": "<|endoftext|>"
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/tokenizer/vocab.json ADDED
The diff for this file is too large to render.
 
Gradient_ascent_traininig_scripts/checkpoint/car/unet/config.json ADDED
@@ -0,0 +1,68 @@
+ {
+   "_class_name": "UNet2DConditionModel",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "act_fn": "silu",
+   "addition_embed_type": null,
+   "addition_embed_type_num_heads": 64,
+   "addition_time_embed_dim": null,
+   "attention_head_dim": 8,
+   "attention_type": "default",
+   "block_out_channels": [
+     320,
+     640,
+     1280,
+     1280
+   ],
+   "center_input_sample": false,
+   "class_embed_type": null,
+   "class_embeddings_concat": false,
+   "conv_in_kernel": 3,
+   "conv_out_kernel": 3,
+   "cross_attention_dim": 768,
+   "cross_attention_norm": null,
+   "down_block_types": [
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "DownBlock2D"
+   ],
+   "downsample_padding": 1,
+   "dropout": 0.0,
+   "dual_cross_attention": false,
+   "encoder_hid_dim": null,
+   "encoder_hid_dim_type": null,
+   "flip_sin_to_cos": true,
+   "freq_shift": 0,
+   "in_channels": 4,
+   "layers_per_block": 2,
+   "mid_block_only_cross_attention": null,
+   "mid_block_scale_factor": 1,
+   "mid_block_type": "UNetMidBlock2DCrossAttn",
+   "norm_eps": 1e-05,
+   "norm_num_groups": 32,
+   "num_attention_heads": null,
+   "num_class_embeds": null,
+   "only_cross_attention": false,
+   "out_channels": 4,
+   "projection_class_embeddings_input_dim": null,
+   "resnet_out_scale_factor": 1.0,
+   "resnet_skip_time_act": false,
+   "resnet_time_scale_shift": "default",
+   "reverse_transformer_layers_per_block": null,
+   "sample_size": 64,
+   "time_cond_proj_dim": null,
+   "time_embedding_act_fn": null,
+   "time_embedding_dim": null,
+   "time_embedding_type": "positional",
+   "timestep_post_act": null,
+   "transformer_layers_per_block": 1,
+   "up_block_types": [
+     "UpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D"
+   ],
+   "upcast_attention": false,
+   "use_linear_projection": false
+ }
Gradient_ascent_traininig_scripts/checkpoint/car/vae/config.json ADDED
@@ -0,0 +1,38 @@
+ {
+   "_class_name": "AutoencoderKL",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "act_fn": "silu",
+   "block_out_channels": [
+     128,
+     256,
+     512,
+     512
+   ],
+   "down_block_types": [
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D"
+   ],
+   "force_upcast": true,
+   "in_channels": 3,
+   "latent_channels": 4,
+   "latents_mean": null,
+   "latents_std": null,
+   "layers_per_block": 2,
+   "mid_block_add_attention": true,
+   "norm_num_groups": 32,
+   "out_channels": 3,
+   "sample_size": 512,
+   "scaling_factor": 0.18215,
+   "shift_factor": null,
+   "up_block_types": [
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D"
+   ],
+   "use_post_quant_conv": true,
+   "use_quant_conv": true
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,44 @@
+ {
+   "_valid_processor_keys": [
+     "images",
+     "do_resize",
+     "size",
+     "resample",
+     "do_center_crop",
+     "crop_size",
+     "do_rescale",
+     "rescale_factor",
+     "do_normalize",
+     "image_mean",
+     "image_std",
+     "do_convert_rgb",
+     "return_tensors",
+     "data_format",
+     "input_data_format"
+   ],
+   "crop_size": {
+     "height": 224,
+     "width": 224
+   },
+   "do_center_crop": true,
+   "do_convert_rgb": true,
+   "do_normalize": true,
+   "do_rescale": true,
+   "do_resize": true,
+   "image_mean": [
+     0.48145466,
+     0.4578275,
+     0.40821073
+   ],
+   "image_processor_type": "CLIPImageProcessor",
+   "image_std": [
+     0.26862954,
+     0.26130258,
+     0.27577711
+   ],
+   "resample": 3,
+   "rescale_factor": 0.00392156862745098,
+   "size": {
+     "shortest_edge": 224
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/model_index.json ADDED
@@ -0,0 +1,38 @@
+ {
+   "_class_name": "StableDiffusionPipeline",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "feature_extractor": [
+     "transformers",
+     "CLIPImageProcessor"
+   ],
+   "image_encoder": [
+     null,
+     null
+   ],
+   "requires_safety_checker": true,
+   "safety_checker": [
+     "stable_diffusion",
+     "StableDiffusionSafetyChecker"
+   ],
+   "scheduler": [
+     "diffusers",
+     "PNDMScheduler"
+   ],
+   "text_encoder": [
+     "transformers",
+     "CLIPTextModel"
+   ],
+   "tokenizer": [
+     "transformers",
+     "CLIPTokenizer"
+   ],
+   "unet": [
+     "diffusers",
+     "UNet2DConditionModel"
+   ],
+   "vae": [
+     "diffusers",
+     "AutoencoderKL"
+   ]
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/safety_checker/config.json ADDED
@@ -0,0 +1,28 @@
+ {
+   "_name_or_path": "/share/u/kevin/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/safety_checker",
+   "architectures": [
+     "StableDiffusionSafetyChecker"
+   ],
+   "initializer_factor": 1.0,
+   "logit_scale_init_value": 2.6592,
+   "model_type": "clip",
+   "projection_dim": 768,
+   "text_config": {
+     "dropout": 0.0,
+     "hidden_size": 768,
+     "intermediate_size": 3072,
+     "model_type": "clip_text_model",
+     "num_attention_heads": 12
+   },
+   "torch_dtype": "float32",
+   "transformers_version": "4.41.0",
+   "vision_config": {
+     "dropout": 0.0,
+     "hidden_size": 1024,
+     "intermediate_size": 4096,
+     "model_type": "clip_vision_model",
+     "num_attention_heads": 16,
+     "num_hidden_layers": 24,
+     "patch_size": 14
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/scheduler/scheduler_config.json ADDED
@@ -0,0 +1,15 @@
+ {
+   "_class_name": "PNDMScheduler",
+   "_diffusers_version": "0.31.0",
+   "beta_end": 0.012,
+   "beta_schedule": "scaled_linear",
+   "beta_start": 0.00085,
+   "clip_sample": false,
+   "num_train_timesteps": 1000,
+   "prediction_type": "epsilon",
+   "set_alpha_to_one": false,
+   "skip_prk_steps": true,
+   "steps_offset": 1,
+   "timestep_spacing": "leading",
+   "trained_betas": null
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/text_encoder/config.json ADDED
@@ -0,0 +1,25 @@
+ {
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "architectures": [
+     "CLIPTextModel"
+   ],
+   "attention_dropout": 0.0,
+   "bos_token_id": 0,
+   "dropout": 0.0,
+   "eos_token_id": 2,
+   "hidden_act": "quick_gelu",
+   "hidden_size": 768,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "layer_norm_eps": 1e-05,
+   "max_position_embeddings": 77,
+   "model_type": "clip_text_model",
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "pad_token_id": 1,
+   "projection_dim": 512,
+   "torch_dtype": "float16",
+   "transformers_version": "4.41.0",
+   "vocab_size": 49408
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/merges.txt ADDED
The diff for this file is too large to render.
 
Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|endoftext|>",
+   "unk_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "add_prefix_space": false,
+   "added_tokens_decoder": {
+     "49406": {
+       "content": "<|startoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "49407": {
+       "content": "<|endoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<|startoftext|>",
+   "clean_up_tokenization_spaces": true,
+   "do_lower_case": true,
+   "eos_token": "<|endoftext|>",
+   "errors": "replace",
+   "model_max_length": 77,
+   "pad_token": "<|endoftext|>",
+   "tokenizer_class": "CLIPTokenizer",
+   "unk_token": "<|endoftext|>"
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/tokenizer/vocab.json ADDED
The diff for this file is too large to render.
 
Gradient_ascent_traininig_scripts/checkpoint/english_springer/unet/config.json ADDED
@@ -0,0 +1,68 @@
+ {
+   "_class_name": "UNet2DConditionModel",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "act_fn": "silu",
+   "addition_embed_type": null,
+   "addition_embed_type_num_heads": 64,
+   "addition_time_embed_dim": null,
+   "attention_head_dim": 8,
+   "attention_type": "default",
+   "block_out_channels": [
+     320,
+     640,
+     1280,
+     1280
+   ],
+   "center_input_sample": false,
+   "class_embed_type": null,
+   "class_embeddings_concat": false,
+   "conv_in_kernel": 3,
+   "conv_out_kernel": 3,
+   "cross_attention_dim": 768,
+   "cross_attention_norm": null,
+   "down_block_types": [
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "DownBlock2D"
+   ],
+   "downsample_padding": 1,
+   "dropout": 0.0,
+   "dual_cross_attention": false,
+   "encoder_hid_dim": null,
+   "encoder_hid_dim_type": null,
+   "flip_sin_to_cos": true,
+   "freq_shift": 0,
+   "in_channels": 4,
+   "layers_per_block": 2,
+   "mid_block_only_cross_attention": null,
+   "mid_block_scale_factor": 1,
+   "mid_block_type": "UNetMidBlock2DCrossAttn",
+   "norm_eps": 1e-05,
+   "norm_num_groups": 32,
+   "num_attention_heads": null,
+   "num_class_embeds": null,
+   "only_cross_attention": false,
+   "out_channels": 4,
+   "projection_class_embeddings_input_dim": null,
+   "resnet_out_scale_factor": 1.0,
+   "resnet_skip_time_act": false,
+   "resnet_time_scale_shift": "default",
+   "reverse_transformer_layers_per_block": null,
+   "sample_size": 64,
+   "time_cond_proj_dim": null,
+   "time_embedding_act_fn": null,
+   "time_embedding_dim": null,
+   "time_embedding_type": "positional",
+   "timestep_post_act": null,
+   "transformer_layers_per_block": 1,
+   "up_block_types": [
+     "UpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D"
+   ],
+   "upcast_attention": false,
+   "use_linear_projection": false
+ }
Gradient_ascent_traininig_scripts/checkpoint/english_springer/vae/config.json ADDED
@@ -0,0 +1,38 @@
+ {
+   "_class_name": "AutoencoderKL",
+   "_diffusers_version": "0.31.0",
+   "_name_or_path": "CompVis/stable-diffusion-v1-4",
+   "act_fn": "silu",
+   "block_out_channels": [
+     128,
+     256,
+     512,
+     512
+   ],
+   "down_block_types": [
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D"
+   ],
+   "force_upcast": true,
+   "in_channels": 3,
+   "latent_channels": 4,
+   "latents_mean": null,
+   "latents_std": null,
+   "layers_per_block": 2,
+   "mid_block_add_attention": true,
+   "norm_num_groups": 32,
+   "out_channels": 3,
+   "sample_size": 512,
+   "scaling_factor": 0.18215,
+   "shift_factor": null,
+   "up_block_types": [
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D"
+   ],
+   "use_post_quant_conv": true,
+   "use_quant_conv": true
+ }
Gradient_ascent_traininig_scripts/clear_cache.py ADDED
@@ -0,0 +1,10 @@
+ import torch
+ 
+ def clear_cuda_cache():
+     if torch.cuda.is_available():
+         torch.cuda.empty_cache()
+         print("CUDA cache cleared.")
+     else:
+         print("CUDA is not available on this device.")
+ 
+ clear_cuda_cache()
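
Note that torch.cuda.empty_cache() only returns blocks held by PyTorch's caching allocator; tensors still referenced from Python keep their memory. A sketch of the fuller pattern (not part of this commit):

import gc
import torch

if torch.cuda.is_available():
    x = torch.empty(1024, 1024, device="cuda")  # stand-in for a large object
    del x                     # drop the Python reference first
    gc.collect()              # collect anything still holding tensors
    torch.cuda.empty_cache()  # then release the allocator's cached blocks
    print(f"allocated: {torch.cuda.memory_allocated() / 1e9:.3f} GB")
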
Gradient_ascent_traininig_scripts/data/car/metadata.jsonl ADDED
@@ -0,0 +1,1000 @@
+ {"file_name": "train/1.jpg", "text": "a car"}
+ {"file_name": "train/2.jpg", "text": "a car"}
+ {"file_name": "train/3.jpg", "text": "a car"}
+ {"file_name": "train/4.jpg", "text": "a car"}
+ {"file_name": "train/5.jpg", "text": "a car"}
+ {"file_name": "train/6.jpg", "text": "a car"}
+ {"file_name": "train/7.jpg", "text": "a car"}
+ {"file_name": "train/8.jpg", "text": "a car"}
+ {"file_name": "train/9.jpg", "text": "a car"}
+ {"file_name": "train/10.jpg", "text": "a car"}
+ {"file_name": "train/11.jpg", "text": "a car"}
+ {"file_name": "train/12.jpg", "text": "a car"}
+ {"file_name": "train/13.jpg", "text": "a car"}
+ {"file_name": "train/14.jpg", "text": "a car"}
+ {"file_name": "train/15.jpg", "text": "a car"}
+ {"file_name": "train/16.jpg", "text": "a car"}
+ {"file_name": "train/17.jpg", "text": "a car"}
+ {"file_name": "train/18.jpg", "text": "a car"}
+ {"file_name": "train/19.jpg", "text": "a car"}
+ {"file_name": "train/20.jpg", "text": "a car"}
+ {"file_name": "train/21.jpg", "text": "a car"}
+ {"file_name": "train/22.jpg", "text": "a car"}
+ {"file_name": "train/23.jpg", "text": "a car"}
+ {"file_name": "train/24.jpg", "text": "a car"}
+ {"file_name": "train/25.jpg", "text": "a car"}
+ {"file_name": "train/26.jpg", "text": "a car"}
+ {"file_name": "train/27.jpg", "text": "a car"}
+ {"file_name": "train/28.jpg", "text": "a car"}
+ {"file_name": "train/29.jpg", "text": "a car"}
+ {"file_name": "train/30.jpg", "text": "a car"}
+ {"file_name": "train/31.jpg", "text": "a car"}
+ {"file_name": "train/32.jpg", "text": "a car"}
+ {"file_name": "train/33.jpg", "text": "a car"}
+ {"file_name": "train/34.jpg", "text": "a car"}
+ {"file_name": "train/35.jpg", "text": "a car"}
+ {"file_name": "train/36.jpg", "text": "a car"}
+ {"file_name": "train/37.jpg", "text": "a car"}
+ {"file_name": "train/38.jpg", "text": "a car"}
+ {"file_name": "train/39.jpg", "text": "a car"}
+ {"file_name": "train/40.jpg", "text": "a car"}
+ {"file_name": "train/41.jpg", "text": "a car"}
+ {"file_name": "train/42.jpg", "text": "a car"}
+ {"file_name": "train/43.jpg", "text": "a car"}
+ {"file_name": "train/44.jpg", "text": "a car"}
+ {"file_name": "train/45.jpg", "text": "a car"}
+ {"file_name": "train/46.jpg", "text": "a car"}
+ {"file_name": "train/47.jpg", "text": "a car"}
+ {"file_name": "train/48.jpg", "text": "a car"}
+ {"file_name": "train/49.jpg", "text": "a car"}
+ {"file_name": "train/50.jpg", "text": "a car"}
+ {"file_name": "train/51.jpg", "text": "a car"}
+ {"file_name": "train/52.jpg", "text": "a car"}
+ {"file_name": "train/53.jpg", "text": "a car"}
+ {"file_name": "train/54.jpg", "text": "a car"}
+ {"file_name": "train/55.jpg", "text": "a car"}
+ {"file_name": "train/56.jpg", "text": "a car"}
+ {"file_name": "train/57.jpg", "text": "a car"}
+ {"file_name": "train/58.jpg", "text": "a car"}
+ {"file_name": "train/59.jpg", "text": "a car"}
+ {"file_name": "train/60.jpg", "text": "a car"}
+ {"file_name": "train/61.jpg", "text": "a car"}
+ {"file_name": "train/62.jpg", "text": "a car"}
+ {"file_name": "train/63.jpg", "text": "a car"}
+ {"file_name": "train/64.jpg", "text": "a car"}
+ {"file_name": "train/65.jpg", "text": "a car"}
+ {"file_name": "train/66.jpg", "text": "a car"}
+ {"file_name": "train/67.jpg", "text": "a car"}
+ {"file_name": "train/68.jpg", "text": "a car"}
+ {"file_name": "train/69.jpg", "text": "a car"}
+ {"file_name": "train/70.jpg", "text": "a car"}
+ {"file_name": "train/71.jpg", "text": "a car"}
+ {"file_name": "train/72.jpg", "text": "a car"}
+ {"file_name": "train/73.jpg", "text": "a car"}
+ {"file_name": "train/74.jpg", "text": "a car"}
+ {"file_name": "train/75.jpg", "text": "a car"}
+ {"file_name": "train/76.jpg", "text": "a car"}
+ {"file_name": "train/77.jpg", "text": "a car"}
+ {"file_name": "train/78.jpg", "text": "a car"}
+ {"file_name": "train/79.jpg", "text": "a car"}
+ {"file_name": "train/80.jpg", "text": "a car"}
+ {"file_name": "train/81.jpg", "text": "a car"}
+ {"file_name": "train/82.jpg", "text": "a car"}
+ {"file_name": "train/83.jpg", "text": "a car"}
+ {"file_name": "train/84.jpg", "text": "a car"}
+ {"file_name": "train/85.jpg", "text": "a car"}
+ {"file_name": "train/86.jpg", "text": "a car"}
+ {"file_name": "train/87.jpg", "text": "a car"}
+ {"file_name": "train/88.jpg", "text": "a car"}
+ {"file_name": "train/89.jpg", "text": "a car"}
+ {"file_name": "train/90.jpg", "text": "a car"}
+ {"file_name": "train/91.jpg", "text": "a car"}
+ {"file_name": "train/92.jpg", "text": "a car"}
+ {"file_name": "train/93.jpg", "text": "a car"}
+ {"file_name": "train/94.jpg", "text": "a car"}
+ {"file_name": "train/95.jpg", "text": "a car"}
+ {"file_name": "train/96.jpg", "text": "a car"}
+ {"file_name": "train/97.jpg", "text": "a car"}
+ {"file_name": "train/98.jpg", "text": "a car"}
+ {"file_name": "train/99.jpg", "text": "a car"}
+ {"file_name": "train/100.jpg", "text": "a car"}
+ {"file_name": "train/101.jpg", "text": "a car"}
+ {"file_name": "train/102.jpg", "text": "a car"}
+ {"file_name": "train/103.jpg", "text": "a car"}
+ {"file_name": "train/104.jpg", "text": "a car"}
+ {"file_name": "train/105.jpg", "text": "a car"}
+ {"file_name": "train/106.jpg", "text": "a car"}
+ {"file_name": "train/107.jpg", "text": "a car"}
+ {"file_name": "train/108.jpg", "text": "a car"}
+ {"file_name": "train/109.jpg", "text": "a car"}
+ {"file_name": "train/110.jpg", "text": "a car"}
+ {"file_name": "train/111.jpg", "text": "a car"}
+ {"file_name": "train/112.jpg", "text": "a car"}
+ {"file_name": "train/113.jpg", "text": "a car"}
+ {"file_name": "train/114.jpg", "text": "a car"}
+ {"file_name": "train/115.jpg", "text": "a car"}
+ {"file_name": "train/116.jpg", "text": "a car"}
+ {"file_name": "train/117.jpg", "text": "a car"}
+ {"file_name": "train/118.jpg", "text": "a car"}
+ {"file_name": "train/119.jpg", "text": "a car"}
+ {"file_name": "train/120.jpg", "text": "a car"}
+ {"file_name": "train/121.jpg", "text": "a car"}
+ {"file_name": "train/122.jpg", "text": "a car"}
+ {"file_name": "train/123.jpg", "text": "a car"}
+ {"file_name": "train/124.jpg", "text": "a car"}
+ {"file_name": "train/125.jpg", "text": "a car"}
+ {"file_name": "train/126.jpg", "text": "a car"}
+ {"file_name": "train/127.jpg", "text": "a car"}
+ {"file_name": "train/128.jpg", "text": "a car"}
+ {"file_name": "train/129.jpg", "text": "a car"}
+ {"file_name": "train/130.jpg", "text": "a car"}
+ {"file_name": "train/131.jpg", "text": "a car"}
+ {"file_name": "train/132.jpg", "text": "a car"}
+ {"file_name": "train/133.jpg", "text": "a car"}
+ {"file_name": "train/134.jpg", "text": "a car"}
+ {"file_name": "train/135.jpg", "text": "a car"}
+ {"file_name": "train/136.jpg", "text": "a car"}
+ {"file_name": "train/137.jpg", "text": "a car"}
+ {"file_name": "train/138.jpg", "text": "a car"}
+ {"file_name": "train/139.jpg", "text": "a car"}
+ {"file_name": "train/140.jpg", "text": "a car"}
+ {"file_name": "train/141.jpg", "text": "a car"}
+ {"file_name": "train/142.jpg", "text": "a car"}
+ {"file_name": "train/143.jpg", "text": "a car"}
+ {"file_name": "train/144.jpg", "text": "a car"}
+ {"file_name": "train/145.jpg", "text": "a car"}
+ {"file_name": "train/146.jpg", "text": "a car"}
+ {"file_name": "train/147.jpg", "text": "a car"}
+ {"file_name": "train/148.jpg", "text": "a car"}
+ {"file_name": "train/149.jpg", "text": "a car"}
+ {"file_name": "train/150.jpg", "text": "a car"}
+ {"file_name": "train/151.jpg", "text": "a car"}
+ {"file_name": "train/152.jpg", "text": "a car"}
+ {"file_name": "train/153.jpg", "text": "a car"}
+ {"file_name": "train/154.jpg", "text": "a car"}
+ {"file_name": "train/155.jpg", "text": "a car"}
+ {"file_name": "train/156.jpg", "text": "a car"}
+ {"file_name": "train/157.jpg", "text": "a car"}
+ {"file_name": "train/158.jpg", "text": "a car"}
+ {"file_name": "train/159.jpg", "text": "a car"}
+ {"file_name": "train/160.jpg", "text": "a car"}
+ {"file_name": "train/161.jpg", "text": "a car"}
+ {"file_name": "train/162.jpg", "text": "a car"}
+ {"file_name": "train/163.jpg", "text": "a car"}
+ {"file_name": "train/164.jpg", "text": "a car"}
+ {"file_name": "train/165.jpg", "text": "a car"}
+ {"file_name": "train/166.jpg", "text": "a car"}
+ {"file_name": "train/167.jpg", "text": "a car"}
+ {"file_name": "train/168.jpg", "text": "a car"}
+ {"file_name": "train/169.jpg", "text": "a car"}
+ {"file_name": "train/170.jpg", "text": "a car"}
+ {"file_name": "train/171.jpg", "text": "a car"}
+ {"file_name": "train/172.jpg", "text": "a car"}
+ {"file_name": "train/173.jpg", "text": "a car"}
+ {"file_name": "train/174.jpg", "text": "a car"}
+ {"file_name": "train/175.jpg", "text": "a car"}
+ {"file_name": "train/176.jpg", "text": "a car"}
+ {"file_name": "train/177.jpg", "text": "a car"}
+ {"file_name": "train/178.jpg", "text": "a car"}
+ {"file_name": "train/179.jpg", "text": "a car"}
+ {"file_name": "train/180.jpg", "text": "a car"}
+ {"file_name": "train/181.jpg", "text": "a car"}
+ {"file_name": "train/182.jpg", "text": "a car"}
+ {"file_name": "train/183.jpg", "text": "a car"}
+ {"file_name": "train/184.jpg", "text": "a car"}
+ {"file_name": "train/185.jpg", "text": "a car"}
+ {"file_name": "train/186.jpg", "text": "a car"}
+ {"file_name": "train/187.jpg", "text": "a car"}
+ {"file_name": "train/188.jpg", "text": "a car"}
+ {"file_name": "train/189.jpg", "text": "a car"}
+ {"file_name": "train/190.jpg", "text": "a car"}
+ {"file_name": "train/191.jpg", "text": "a car"}
+ {"file_name": "train/192.jpg", "text": "a car"}
+ {"file_name": "train/193.jpg", "text": "a car"}
+ {"file_name": "train/194.jpg", "text": "a car"}
+ {"file_name": "train/195.jpg", "text": "a car"}
+ {"file_name": "train/196.jpg", "text": "a car"}
+ {"file_name": "train/197.jpg", "text": "a car"}
+ {"file_name": "train/198.jpg", "text": "a car"}
+ {"file_name": "train/199.jpg", "text": "a car"}
+ {"file_name": "train/200.jpg", "text": "a car"}
+ {"file_name": "train/201.jpg", "text": "a car"}
+ {"file_name": "train/202.jpg", "text": "a car"}
+ {"file_name": "train/203.jpg", "text": "a car"}
+ {"file_name": "train/204.jpg", "text": "a car"}
+ {"file_name": "train/205.jpg", "text": "a car"}
+ {"file_name": "train/206.jpg", "text": "a car"}
+ {"file_name": "train/207.jpg", "text": "a car"}
+ {"file_name": "train/208.jpg", "text": "a car"}
+ {"file_name": "train/209.jpg", "text": "a car"}
+ {"file_name": "train/210.jpg", "text": "a car"}
+ {"file_name": "train/211.jpg", "text": "a car"}
+ {"file_name": "train/212.jpg", "text": "a car"}
+ {"file_name": "train/213.jpg", "text": "a car"}
+ {"file_name": "train/214.jpg", "text": "a car"}
+ {"file_name": "train/215.jpg", "text": "a car"}
+ {"file_name": "train/216.jpg", "text": "a car"}
+ {"file_name": "train/217.jpg", "text": "a car"}
+ {"file_name": "train/218.jpg", "text": "a car"}
+ {"file_name": "train/219.jpg", "text": "a car"}
+ {"file_name": "train/220.jpg", "text": "a car"}
+ {"file_name": "train/221.jpg", "text": "a car"}
+ {"file_name": "train/222.jpg", "text": "a car"}
+ {"file_name": "train/223.jpg", "text": "a car"}
+ {"file_name": "train/224.jpg", "text": "a car"}
+ {"file_name": "train/225.jpg", "text": "a car"}
+ {"file_name": "train/226.jpg", "text": "a car"}
+ {"file_name": "train/227.jpg", "text": "a car"}
+ {"file_name": "train/228.jpg", "text": "a car"}
+ {"file_name": "train/229.jpg", "text": "a car"}
+ {"file_name": "train/230.jpg", "text": "a car"}
+ {"file_name": "train/231.jpg", "text": "a car"}
+ {"file_name": "train/232.jpg", "text": "a car"}
+ {"file_name": "train/233.jpg", "text": "a car"}
+ {"file_name": "train/234.jpg", "text": "a car"}
+ {"file_name": "train/235.jpg", "text": "a car"}
+ {"file_name": "train/236.jpg", "text": "a car"}
+ {"file_name": "train/237.jpg", "text": "a car"}
+ {"file_name": "train/238.jpg", "text": "a car"}
+ {"file_name": "train/239.jpg", "text": "a car"}
+ {"file_name": "train/240.jpg", "text": "a car"}
+ {"file_name": "train/241.jpg", "text": "a car"}
+ {"file_name": "train/242.jpg", "text": "a car"}
+ {"file_name": "train/243.jpg", "text": "a car"}
+ {"file_name": "train/244.jpg", "text": "a car"}
+ {"file_name": "train/245.jpg", "text": "a car"}
+ {"file_name": "train/246.jpg", "text": "a car"}
+ {"file_name": "train/247.jpg", "text": "a car"}
+ {"file_name": "train/248.jpg", "text": "a car"}
+ {"file_name": "train/249.jpg", "text": "a car"}
+ {"file_name": "train/250.jpg", "text": "a car"}
+ {"file_name": "train/251.jpg", "text": "a car"}
+ {"file_name": "train/252.jpg", "text": "a car"}
+ {"file_name": "train/253.jpg", "text": "a car"}
+ {"file_name": "train/254.jpg", "text": "a car"}
+ {"file_name": "train/255.jpg", "text": "a car"}
+ {"file_name": "train/256.jpg", "text": "a car"}
+ {"file_name": "train/257.jpg", "text": "a car"}
+ {"file_name": "train/258.jpg", "text": "a car"}
+ {"file_name": "train/259.jpg", "text": "a car"}
+ {"file_name": "train/260.jpg", "text": "a car"}
+ {"file_name": "train/261.jpg", "text": "a car"}
+ {"file_name": "train/262.jpg", "text": "a car"}
+ {"file_name": "train/263.jpg", "text": "a car"}
+ {"file_name": "train/264.jpg", "text": "a car"}
+ {"file_name": "train/265.jpg", "text": "a car"}
+ {"file_name": "train/266.jpg", "text": "a car"}
+ {"file_name": "train/267.jpg", "text": "a car"}
+ {"file_name": "train/268.jpg", "text": "a car"}
+ {"file_name": "train/269.jpg", "text": "a car"}
+ {"file_name": "train/270.jpg", "text": "a car"}
+ {"file_name": "train/271.jpg", "text": "a car"}
+ {"file_name": "train/272.jpg", "text": "a car"}
+ {"file_name": "train/273.jpg", "text": "a car"}
+ {"file_name": "train/274.jpg", "text": "a car"}
+ {"file_name": "train/275.jpg", "text": "a car"}
+ {"file_name": "train/276.jpg", "text": "a car"}
+ {"file_name": "train/277.jpg", "text": "a car"}
+ {"file_name": "train/278.jpg", "text": "a car"}
+ {"file_name": "train/279.jpg", "text": "a car"}
+ {"file_name": "train/280.jpg", "text": "a car"}
+ {"file_name": "train/281.jpg", "text": "a car"}
+ {"file_name": "train/282.jpg", "text": "a car"}
+ {"file_name": "train/283.jpg", "text": "a car"}
+ {"file_name": "train/284.jpg", "text": "a car"}
+ {"file_name": "train/285.jpg", "text": "a car"}
+ {"file_name": "train/286.jpg", "text": "a car"}
+ {"file_name": "train/287.jpg", "text": "a car"}
+ {"file_name": "train/288.jpg", "text": "a car"}
+ {"file_name": "train/289.jpg", "text": "a car"}
+ {"file_name": "train/290.jpg", "text": "a car"}
+ {"file_name": "train/291.jpg", "text": "a car"}
+ {"file_name": "train/292.jpg", "text": "a car"}
+ {"file_name": "train/293.jpg", "text": "a car"}
+ {"file_name": "train/294.jpg", "text": "a car"}
+ {"file_name": "train/295.jpg", "text": "a car"}
+ {"file_name": "train/296.jpg", "text": "a car"}
+ {"file_name": "train/297.jpg", "text": "a car"}
+ {"file_name": "train/298.jpg", "text": "a car"}
+ {"file_name": "train/299.jpg", "text": "a car"}
+ {"file_name": "train/300.jpg", "text": "a car"}
+ {"file_name": "train/301.jpg", "text": "a car"}
+ {"file_name": "train/302.jpg", "text": "a car"}
+ {"file_name": "train/303.jpg", "text": "a car"}
+ {"file_name": "train/304.jpg", "text": "a car"}
+ {"file_name": "train/305.jpg", "text": "a car"}
+ {"file_name": "train/306.jpg", "text": "a car"}
+ {"file_name": "train/307.jpg", "text": "a car"}
+ {"file_name": "train/308.jpg", "text": "a car"}
+ {"file_name": "train/309.jpg", "text": "a car"}
+ {"file_name": "train/310.jpg", "text": "a car"}
+ {"file_name": "train/311.jpg", "text": "a car"}
+ {"file_name": "train/312.jpg", "text": "a car"}
+ {"file_name": "train/313.jpg", "text": "a car"}
+ {"file_name": "train/314.jpg", "text": "a car"}
315
+ {"file_name": "train/315.jpg", "text": "a car"}
316
+ {"file_name": "train/316.jpg", "text": "a car"}
317
+ {"file_name": "train/317.jpg", "text": "a car"}
318
+ {"file_name": "train/318.jpg", "text": "a car"}
319
+ {"file_name": "train/319.jpg", "text": "a car"}
320
+ {"file_name": "train/320.jpg", "text": "a car"}
321
+ {"file_name": "train/321.jpg", "text": "a car"}
322
+ {"file_name": "train/322.jpg", "text": "a car"}
323
+ {"file_name": "train/323.jpg", "text": "a car"}
324
+ {"file_name": "train/324.jpg", "text": "a car"}
325
+ {"file_name": "train/325.jpg", "text": "a car"}
326
+ {"file_name": "train/326.jpg", "text": "a car"}
327
+ {"file_name": "train/327.jpg", "text": "a car"}
328
+ {"file_name": "train/328.jpg", "text": "a car"}
329
+ {"file_name": "train/329.jpg", "text": "a car"}
330
+ {"file_name": "train/330.jpg", "text": "a car"}
331
+ {"file_name": "train/331.jpg", "text": "a car"}
332
+ {"file_name": "train/332.jpg", "text": "a car"}
333
+ {"file_name": "train/333.jpg", "text": "a car"}
334
+ {"file_name": "train/334.jpg", "text": "a car"}
335
+ {"file_name": "train/335.jpg", "text": "a car"}
336
+ {"file_name": "train/336.jpg", "text": "a car"}
337
+ {"file_name": "train/337.jpg", "text": "a car"}
338
+ {"file_name": "train/338.jpg", "text": "a car"}
339
+ {"file_name": "train/339.jpg", "text": "a car"}
340
+ {"file_name": "train/340.jpg", "text": "a car"}
341
+ {"file_name": "train/341.jpg", "text": "a car"}
342
+ {"file_name": "train/342.jpg", "text": "a car"}
343
+ {"file_name": "train/343.jpg", "text": "a car"}
344
+ {"file_name": "train/344.jpg", "text": "a car"}
345
+ {"file_name": "train/345.jpg", "text": "a car"}
346
+ {"file_name": "train/346.jpg", "text": "a car"}
347
+ {"file_name": "train/347.jpg", "text": "a car"}
348
+ {"file_name": "train/348.jpg", "text": "a car"}
349
+ {"file_name": "train/349.jpg", "text": "a car"}
350
+ {"file_name": "train/350.jpg", "text": "a car"}
351
+ {"file_name": "train/351.jpg", "text": "a car"}
352
+ {"file_name": "train/352.jpg", "text": "a car"}
353
+ {"file_name": "train/353.jpg", "text": "a car"}
354
+ {"file_name": "train/354.jpg", "text": "a car"}
355
+ {"file_name": "train/355.jpg", "text": "a car"}
356
+ {"file_name": "train/356.jpg", "text": "a car"}
357
+ {"file_name": "train/357.jpg", "text": "a car"}
358
+ {"file_name": "train/358.jpg", "text": "a car"}
359
+ {"file_name": "train/359.jpg", "text": "a car"}
360
+ {"file_name": "train/360.jpg", "text": "a car"}
361
+ {"file_name": "train/361.jpg", "text": "a car"}
362
+ {"file_name": "train/362.jpg", "text": "a car"}
363
+ {"file_name": "train/363.jpg", "text": "a car"}
364
+ {"file_name": "train/364.jpg", "text": "a car"}
365
+ {"file_name": "train/365.jpg", "text": "a car"}
366
+ {"file_name": "train/366.jpg", "text": "a car"}
367
+ {"file_name": "train/367.jpg", "text": "a car"}
368
+ {"file_name": "train/368.jpg", "text": "a car"}
369
+ {"file_name": "train/369.jpg", "text": "a car"}
370
+ {"file_name": "train/370.jpg", "text": "a car"}
371
+ {"file_name": "train/371.jpg", "text": "a car"}
372
+ {"file_name": "train/372.jpg", "text": "a car"}
373
+ {"file_name": "train/373.jpg", "text": "a car"}
374
+ {"file_name": "train/374.jpg", "text": "a car"}
375
+ {"file_name": "train/375.jpg", "text": "a car"}
376
+ {"file_name": "train/376.jpg", "text": "a car"}
377
+ {"file_name": "train/377.jpg", "text": "a car"}
378
+ {"file_name": "train/378.jpg", "text": "a car"}
379
+ {"file_name": "train/379.jpg", "text": "a car"}
380
+ {"file_name": "train/380.jpg", "text": "a car"}
381
+ {"file_name": "train/381.jpg", "text": "a car"}
382
+ {"file_name": "train/382.jpg", "text": "a car"}
383
+ {"file_name": "train/383.jpg", "text": "a car"}
384
+ {"file_name": "train/384.jpg", "text": "a car"}
385
+ {"file_name": "train/385.jpg", "text": "a car"}
386
+ {"file_name": "train/386.jpg", "text": "a car"}
387
+ {"file_name": "train/387.jpg", "text": "a car"}
388
+ {"file_name": "train/388.jpg", "text": "a car"}
389
+ {"file_name": "train/389.jpg", "text": "a car"}
390
+ {"file_name": "train/390.jpg", "text": "a car"}
391
+ {"file_name": "train/391.jpg", "text": "a car"}
392
+ {"file_name": "train/392.jpg", "text": "a car"}
393
+ {"file_name": "train/393.jpg", "text": "a car"}
394
+ {"file_name": "train/394.jpg", "text": "a car"}
395
+ {"file_name": "train/395.jpg", "text": "a car"}
396
+ {"file_name": "train/396.jpg", "text": "a car"}
397
+ {"file_name": "train/397.jpg", "text": "a car"}
398
+ {"file_name": "train/398.jpg", "text": "a car"}
399
+ {"file_name": "train/399.jpg", "text": "a car"}
400
+ {"file_name": "train/400.jpg", "text": "a car"}
401
+ {"file_name": "train/401.jpg", "text": "a car"}
402
+ {"file_name": "train/402.jpg", "text": "a car"}
403
+ {"file_name": "train/403.jpg", "text": "a car"}
404
+ {"file_name": "train/404.jpg", "text": "a car"}
405
+ {"file_name": "train/405.jpg", "text": "a car"}
406
+ {"file_name": "train/406.jpg", "text": "a car"}
407
+ {"file_name": "train/407.jpg", "text": "a car"}
408
+ {"file_name": "train/408.jpg", "text": "a car"}
409
+ {"file_name": "train/409.jpg", "text": "a car"}
410
+ {"file_name": "train/410.jpg", "text": "a car"}
411
+ {"file_name": "train/411.jpg", "text": "a car"}
412
+ {"file_name": "train/412.jpg", "text": "a car"}
413
+ {"file_name": "train/413.jpg", "text": "a car"}
414
+ {"file_name": "train/414.jpg", "text": "a car"}
415
+ {"file_name": "train/415.jpg", "text": "a car"}
416
+ {"file_name": "train/416.jpg", "text": "a car"}
417
+ {"file_name": "train/417.jpg", "text": "a car"}
418
+ {"file_name": "train/418.jpg", "text": "a car"}
419
+ {"file_name": "train/419.jpg", "text": "a car"}
420
+ {"file_name": "train/420.jpg", "text": "a car"}
421
+ {"file_name": "train/421.jpg", "text": "a car"}
422
+ {"file_name": "train/422.jpg", "text": "a car"}
423
+ {"file_name": "train/423.jpg", "text": "a car"}
424
+ {"file_name": "train/424.jpg", "text": "a car"}
425
+ {"file_name": "train/425.jpg", "text": "a car"}
426
+ {"file_name": "train/426.jpg", "text": "a car"}
427
+ {"file_name": "train/427.jpg", "text": "a car"}
428
+ {"file_name": "train/428.jpg", "text": "a car"}
429
+ {"file_name": "train/429.jpg", "text": "a car"}
430
+ {"file_name": "train/430.jpg", "text": "a car"}
431
+ {"file_name": "train/431.jpg", "text": "a car"}
432
+ {"file_name": "train/432.jpg", "text": "a car"}
433
+ {"file_name": "train/433.jpg", "text": "a car"}
434
+ {"file_name": "train/434.jpg", "text": "a car"}
435
+ {"file_name": "train/435.jpg", "text": "a car"}
436
+ {"file_name": "train/436.jpg", "text": "a car"}
437
+ {"file_name": "train/437.jpg", "text": "a car"}
438
+ {"file_name": "train/438.jpg", "text": "a car"}
439
+ {"file_name": "train/439.jpg", "text": "a car"}
440
+ {"file_name": "train/440.jpg", "text": "a car"}
441
+ {"file_name": "train/441.jpg", "text": "a car"}
442
+ {"file_name": "train/442.jpg", "text": "a car"}
443
+ {"file_name": "train/443.jpg", "text": "a car"}
444
+ {"file_name": "train/444.jpg", "text": "a car"}
445
+ {"file_name": "train/445.jpg", "text": "a car"}
446
+ {"file_name": "train/446.jpg", "text": "a car"}
447
+ {"file_name": "train/447.jpg", "text": "a car"}
448
+ {"file_name": "train/448.jpg", "text": "a car"}
449
+ {"file_name": "train/449.jpg", "text": "a car"}
450
+ {"file_name": "train/450.jpg", "text": "a car"}
451
+ {"file_name": "train/451.jpg", "text": "a car"}
452
+ {"file_name": "train/452.jpg", "text": "a car"}
453
+ {"file_name": "train/453.jpg", "text": "a car"}
454
+ {"file_name": "train/454.jpg", "text": "a car"}
455
+ {"file_name": "train/455.jpg", "text": "a car"}
456
+ {"file_name": "train/456.jpg", "text": "a car"}
457
+ {"file_name": "train/457.jpg", "text": "a car"}
458
+ {"file_name": "train/458.jpg", "text": "a car"}
459
+ {"file_name": "train/459.jpg", "text": "a car"}
460
+ {"file_name": "train/460.jpg", "text": "a car"}
461
+ {"file_name": "train/461.jpg", "text": "a car"}
462
+ {"file_name": "train/462.jpg", "text": "a car"}
463
+ {"file_name": "train/463.jpg", "text": "a car"}
464
+ {"file_name": "train/464.jpg", "text": "a car"}
465
+ {"file_name": "train/465.jpg", "text": "a car"}
466
+ {"file_name": "train/466.jpg", "text": "a car"}
467
+ {"file_name": "train/467.jpg", "text": "a car"}
468
+ {"file_name": "train/468.jpg", "text": "a car"}
469
+ {"file_name": "train/469.jpg", "text": "a car"}
470
+ {"file_name": "train/470.jpg", "text": "a car"}
471
+ {"file_name": "train/471.jpg", "text": "a car"}
472
+ {"file_name": "train/472.jpg", "text": "a car"}
473
+ {"file_name": "train/473.jpg", "text": "a car"}
474
+ {"file_name": "train/474.jpg", "text": "a car"}
475
+ {"file_name": "train/475.jpg", "text": "a car"}
476
+ {"file_name": "train/476.jpg", "text": "a car"}
477
+ {"file_name": "train/477.jpg", "text": "a car"}
478
+ {"file_name": "train/478.jpg", "text": "a car"}
479
+ {"file_name": "train/479.jpg", "text": "a car"}
480
+ {"file_name": "train/480.jpg", "text": "a car"}
481
+ {"file_name": "train/481.jpg", "text": "a car"}
482
+ {"file_name": "train/482.jpg", "text": "a car"}
483
+ {"file_name": "train/483.jpg", "text": "a car"}
484
+ {"file_name": "train/484.jpg", "text": "a car"}
485
+ {"file_name": "train/485.jpg", "text": "a car"}
486
+ {"file_name": "train/486.jpg", "text": "a car"}
487
+ {"file_name": "train/487.jpg", "text": "a car"}
488
+ {"file_name": "train/488.jpg", "text": "a car"}
489
+ {"file_name": "train/489.jpg", "text": "a car"}
490
+ {"file_name": "train/490.jpg", "text": "a car"}
491
+ {"file_name": "train/491.jpg", "text": "a car"}
492
+ {"file_name": "train/492.jpg", "text": "a car"}
493
+ {"file_name": "train/493.jpg", "text": "a car"}
494
+ {"file_name": "train/494.jpg", "text": "a car"}
495
+ {"file_name": "train/495.jpg", "text": "a car"}
496
+ {"file_name": "train/496.jpg", "text": "a car"}
497
+ {"file_name": "train/497.jpg", "text": "a car"}
498
+ {"file_name": "train/498.jpg", "text": "a car"}
499
+ {"file_name": "train/499.jpg", "text": "a car"}
500
+ {"file_name": "train/500.jpg", "text": "a car"}
501
+ {"file_name": "train/501.jpg", "text": "a car"}
502
+ {"file_name": "train/502.jpg", "text": "a car"}
503
+ {"file_name": "train/503.jpg", "text": "a car"}
504
+ {"file_name": "train/504.jpg", "text": "a car"}
505
+ {"file_name": "train/505.jpg", "text": "a car"}
506
+ {"file_name": "train/506.jpg", "text": "a car"}
507
+ {"file_name": "train/507.jpg", "text": "a car"}
508
+ {"file_name": "train/508.jpg", "text": "a car"}
509
+ {"file_name": "train/509.jpg", "text": "a car"}
510
+ {"file_name": "train/510.jpg", "text": "a car"}
511
+ {"file_name": "train/511.jpg", "text": "a car"}
512
+ {"file_name": "train/512.jpg", "text": "a car"}
513
+ {"file_name": "train/513.jpg", "text": "a car"}
514
+ {"file_name": "train/514.jpg", "text": "a car"}
515
+ {"file_name": "train/515.jpg", "text": "a car"}
516
+ {"file_name": "train/516.jpg", "text": "a car"}
517
+ {"file_name": "train/517.jpg", "text": "a car"}
518
+ {"file_name": "train/518.jpg", "text": "a car"}
519
+ {"file_name": "train/519.jpg", "text": "a car"}
520
+ {"file_name": "train/520.jpg", "text": "a car"}
521
+ {"file_name": "train/521.jpg", "text": "a car"}
522
+ {"file_name": "train/522.jpg", "text": "a car"}
523
+ {"file_name": "train/523.jpg", "text": "a car"}
524
+ {"file_name": "train/524.jpg", "text": "a car"}
525
+ {"file_name": "train/525.jpg", "text": "a car"}
526
+ {"file_name": "train/526.jpg", "text": "a car"}
527
+ {"file_name": "train/527.jpg", "text": "a car"}
528
+ {"file_name": "train/528.jpg", "text": "a car"}
529
+ {"file_name": "train/529.jpg", "text": "a car"}
530
+ {"file_name": "train/530.jpg", "text": "a car"}
531
+ {"file_name": "train/531.jpg", "text": "a car"}
532
+ {"file_name": "train/532.jpg", "text": "a car"}
533
+ {"file_name": "train/533.jpg", "text": "a car"}
534
+ {"file_name": "train/534.jpg", "text": "a car"}
535
+ {"file_name": "train/535.jpg", "text": "a car"}
536
+ {"file_name": "train/536.jpg", "text": "a car"}
537
+ {"file_name": "train/537.jpg", "text": "a car"}
538
+ {"file_name": "train/538.jpg", "text": "a car"}
539
+ {"file_name": "train/539.jpg", "text": "a car"}
540
+ {"file_name": "train/540.jpg", "text": "a car"}
541
+ {"file_name": "train/541.jpg", "text": "a car"}
542
+ {"file_name": "train/542.jpg", "text": "a car"}
543
+ {"file_name": "train/543.jpg", "text": "a car"}
544
+ {"file_name": "train/544.jpg", "text": "a car"}
545
+ {"file_name": "train/545.jpg", "text": "a car"}
546
+ {"file_name": "train/546.jpg", "text": "a car"}
547
+ {"file_name": "train/547.jpg", "text": "a car"}
548
+ {"file_name": "train/548.jpg", "text": "a car"}
549
+ {"file_name": "train/549.jpg", "text": "a car"}
550
+ {"file_name": "train/550.jpg", "text": "a car"}
551
+ {"file_name": "train/551.jpg", "text": "a car"}
552
+ {"file_name": "train/552.jpg", "text": "a car"}
553
+ {"file_name": "train/553.jpg", "text": "a car"}
554
+ {"file_name": "train/554.jpg", "text": "a car"}
555
+ {"file_name": "train/555.jpg", "text": "a car"}
556
+ {"file_name": "train/556.jpg", "text": "a car"}
557
+ {"file_name": "train/557.jpg", "text": "a car"}
558
+ {"file_name": "train/558.jpg", "text": "a car"}
559
+ {"file_name": "train/559.jpg", "text": "a car"}
560
+ {"file_name": "train/560.jpg", "text": "a car"}
561
+ {"file_name": "train/561.jpg", "text": "a car"}
562
+ {"file_name": "train/562.jpg", "text": "a car"}
563
+ {"file_name": "train/563.jpg", "text": "a car"}
564
+ {"file_name": "train/564.jpg", "text": "a car"}
565
+ {"file_name": "train/565.jpg", "text": "a car"}
566
+ {"file_name": "train/566.jpg", "text": "a car"}
567
+ {"file_name": "train/567.jpg", "text": "a car"}
568
+ {"file_name": "train/568.jpg", "text": "a car"}
569
+ {"file_name": "train/569.jpg", "text": "a car"}
570
+ {"file_name": "train/570.jpg", "text": "a car"}
571
+ {"file_name": "train/571.jpg", "text": "a car"}
572
+ {"file_name": "train/572.jpg", "text": "a car"}
573
+ {"file_name": "train/573.jpg", "text": "a car"}
574
+ {"file_name": "train/574.jpg", "text": "a car"}
575
+ {"file_name": "train/575.jpg", "text": "a car"}
576
+ {"file_name": "train/576.jpg", "text": "a car"}
577
+ {"file_name": "train/577.jpg", "text": "a car"}
578
+ {"file_name": "train/578.jpg", "text": "a car"}
579
+ {"file_name": "train/579.jpg", "text": "a car"}
580
+ {"file_name": "train/580.jpg", "text": "a car"}
581
+ {"file_name": "train/581.jpg", "text": "a car"}
582
+ {"file_name": "train/582.jpg", "text": "a car"}
583
+ {"file_name": "train/583.jpg", "text": "a car"}
584
+ {"file_name": "train/584.jpg", "text": "a car"}
585
+ {"file_name": "train/585.jpg", "text": "a car"}
586
+ {"file_name": "train/586.jpg", "text": "a car"}
587
+ {"file_name": "train/587.jpg", "text": "a car"}
588
+ {"file_name": "train/588.jpg", "text": "a car"}
589
+ {"file_name": "train/589.jpg", "text": "a car"}
590
+ {"file_name": "train/590.jpg", "text": "a car"}
591
+ {"file_name": "train/591.jpg", "text": "a car"}
592
+ {"file_name": "train/592.jpg", "text": "a car"}
593
+ {"file_name": "train/593.jpg", "text": "a car"}
594
+ {"file_name": "train/594.jpg", "text": "a car"}
595
+ {"file_name": "train/595.jpg", "text": "a car"}
596
+ {"file_name": "train/596.jpg", "text": "a car"}
597
+ {"file_name": "train/597.jpg", "text": "a car"}
598
+ {"file_name": "train/598.jpg", "text": "a car"}
599
+ {"file_name": "train/599.jpg", "text": "a car"}
600
+ {"file_name": "train/600.jpg", "text": "a car"}
601
+ {"file_name": "train/601.jpg", "text": "a car"}
602
+ {"file_name": "train/602.jpg", "text": "a car"}
603
+ {"file_name": "train/603.jpg", "text": "a car"}
604
+ {"file_name": "train/604.jpg", "text": "a car"}
605
+ {"file_name": "train/605.jpg", "text": "a car"}
606
+ {"file_name": "train/606.jpg", "text": "a car"}
607
+ {"file_name": "train/607.jpg", "text": "a car"}
608
+ {"file_name": "train/608.jpg", "text": "a car"}
609
+ {"file_name": "train/609.jpg", "text": "a car"}
610
+ {"file_name": "train/610.jpg", "text": "a car"}
611
+ {"file_name": "train/611.jpg", "text": "a car"}
612
+ {"file_name": "train/612.jpg", "text": "a car"}
613
+ {"file_name": "train/613.jpg", "text": "a car"}
614
+ {"file_name": "train/614.jpg", "text": "a car"}
615
+ {"file_name": "train/615.jpg", "text": "a car"}
616
+ {"file_name": "train/616.jpg", "text": "a car"}
617
+ {"file_name": "train/617.jpg", "text": "a car"}
618
+ {"file_name": "train/618.jpg", "text": "a car"}
619
+ {"file_name": "train/619.jpg", "text": "a car"}
620
+ {"file_name": "train/620.jpg", "text": "a car"}
621
+ {"file_name": "train/621.jpg", "text": "a car"}
622
+ {"file_name": "train/622.jpg", "text": "a car"}
623
+ {"file_name": "train/623.jpg", "text": "a car"}
624
+ {"file_name": "train/624.jpg", "text": "a car"}
625
+ {"file_name": "train/625.jpg", "text": "a car"}
626
+ {"file_name": "train/626.jpg", "text": "a car"}
627
+ {"file_name": "train/627.jpg", "text": "a car"}
628
+ {"file_name": "train/628.jpg", "text": "a car"}
629
+ {"file_name": "train/629.jpg", "text": "a car"}
630
+ {"file_name": "train/630.jpg", "text": "a car"}
631
+ {"file_name": "train/631.jpg", "text": "a car"}
632
+ {"file_name": "train/632.jpg", "text": "a car"}
633
+ {"file_name": "train/633.jpg", "text": "a car"}
634
+ {"file_name": "train/634.jpg", "text": "a car"}
635
+ {"file_name": "train/635.jpg", "text": "a car"}
636
+ {"file_name": "train/636.jpg", "text": "a car"}
637
+ {"file_name": "train/637.jpg", "text": "a car"}
638
+ {"file_name": "train/638.jpg", "text": "a car"}
639
+ {"file_name": "train/639.jpg", "text": "a car"}
640
+ {"file_name": "train/640.jpg", "text": "a car"}
641
+ {"file_name": "train/641.jpg", "text": "a car"}
642
+ {"file_name": "train/642.jpg", "text": "a car"}
643
+ {"file_name": "train/643.jpg", "text": "a car"}
644
+ {"file_name": "train/644.jpg", "text": "a car"}
645
+ {"file_name": "train/645.jpg", "text": "a car"}
646
+ {"file_name": "train/646.jpg", "text": "a car"}
647
+ {"file_name": "train/647.jpg", "text": "a car"}
648
+ {"file_name": "train/648.jpg", "text": "a car"}
649
+ {"file_name": "train/649.jpg", "text": "a car"}
650
+ {"file_name": "train/650.jpg", "text": "a car"}
651
+ {"file_name": "train/651.jpg", "text": "a car"}
652
+ {"file_name": "train/652.jpg", "text": "a car"}
653
+ {"file_name": "train/653.jpg", "text": "a car"}
654
+ {"file_name": "train/654.jpg", "text": "a car"}
655
+ {"file_name": "train/655.jpg", "text": "a car"}
656
+ {"file_name": "train/656.jpg", "text": "a car"}
657
+ {"file_name": "train/657.jpg", "text": "a car"}
658
+ {"file_name": "train/658.jpg", "text": "a car"}
659
+ {"file_name": "train/659.jpg", "text": "a car"}
660
+ {"file_name": "train/660.jpg", "text": "a car"}
661
+ {"file_name": "train/661.jpg", "text": "a car"}
662
+ {"file_name": "train/662.jpg", "text": "a car"}
663
+ {"file_name": "train/663.jpg", "text": "a car"}
664
+ {"file_name": "train/664.jpg", "text": "a car"}
665
+ {"file_name": "train/665.jpg", "text": "a car"}
666
+ {"file_name": "train/666.jpg", "text": "a car"}
667
+ {"file_name": "train/667.jpg", "text": "a car"}
668
+ {"file_name": "train/668.jpg", "text": "a car"}
669
+ {"file_name": "train/669.jpg", "text": "a car"}
670
+ {"file_name": "train/670.jpg", "text": "a car"}
671
+ {"file_name": "train/671.jpg", "text": "a car"}
672
+ {"file_name": "train/672.jpg", "text": "a car"}
673
+ {"file_name": "train/673.jpg", "text": "a car"}
674
+ {"file_name": "train/674.jpg", "text": "a car"}
675
+ {"file_name": "train/675.jpg", "text": "a car"}
676
+ {"file_name": "train/676.jpg", "text": "a car"}
677
+ {"file_name": "train/677.jpg", "text": "a car"}
678
+ {"file_name": "train/678.jpg", "text": "a car"}
679
+ {"file_name": "train/679.jpg", "text": "a car"}
680
+ {"file_name": "train/680.jpg", "text": "a car"}
681
+ {"file_name": "train/681.jpg", "text": "a car"}
682
+ {"file_name": "train/682.jpg", "text": "a car"}
683
+ {"file_name": "train/683.jpg", "text": "a car"}
684
+ {"file_name": "train/684.jpg", "text": "a car"}
685
+ {"file_name": "train/685.jpg", "text": "a car"}
686
+ {"file_name": "train/686.jpg", "text": "a car"}
687
+ {"file_name": "train/687.jpg", "text": "a car"}
688
+ {"file_name": "train/688.jpg", "text": "a car"}
689
+ {"file_name": "train/689.jpg", "text": "a car"}
690
+ {"file_name": "train/690.jpg", "text": "a car"}
691
+ {"file_name": "train/691.jpg", "text": "a car"}
692
+ {"file_name": "train/692.jpg", "text": "a car"}
693
+ {"file_name": "train/693.jpg", "text": "a car"}
694
+ {"file_name": "train/694.jpg", "text": "a car"}
695
+ {"file_name": "train/695.jpg", "text": "a car"}
696
+ {"file_name": "train/696.jpg", "text": "a car"}
697
+ {"file_name": "train/697.jpg", "text": "a car"}
698
+ {"file_name": "train/698.jpg", "text": "a car"}
699
+ {"file_name": "train/699.jpg", "text": "a car"}
700
+ {"file_name": "train/700.jpg", "text": "a car"}
701
+ {"file_name": "train/701.jpg", "text": "a car"}
702
+ {"file_name": "train/702.jpg", "text": "a car"}
703
+ {"file_name": "train/703.jpg", "text": "a car"}
704
+ {"file_name": "train/704.jpg", "text": "a car"}
705
+ {"file_name": "train/705.jpg", "text": "a car"}
706
+ {"file_name": "train/706.jpg", "text": "a car"}
707
+ {"file_name": "train/707.jpg", "text": "a car"}
708
+ {"file_name": "train/708.jpg", "text": "a car"}
709
+ {"file_name": "train/709.jpg", "text": "a car"}
710
+ {"file_name": "train/710.jpg", "text": "a car"}
711
+ {"file_name": "train/711.jpg", "text": "a car"}
712
+ {"file_name": "train/712.jpg", "text": "a car"}
713
+ {"file_name": "train/713.jpg", "text": "a car"}
714
+ {"file_name": "train/714.jpg", "text": "a car"}
715
+ {"file_name": "train/715.jpg", "text": "a car"}
716
+ {"file_name": "train/716.jpg", "text": "a car"}
717
+ {"file_name": "train/717.jpg", "text": "a car"}
718
+ {"file_name": "train/718.jpg", "text": "a car"}
719
+ {"file_name": "train/719.jpg", "text": "a car"}
720
+ {"file_name": "train/720.jpg", "text": "a car"}
721
+ {"file_name": "train/721.jpg", "text": "a car"}
722
+ {"file_name": "train/722.jpg", "text": "a car"}
723
+ {"file_name": "train/723.jpg", "text": "a car"}
724
+ {"file_name": "train/724.jpg", "text": "a car"}
725
+ {"file_name": "train/725.jpg", "text": "a car"}
726
+ {"file_name": "train/726.jpg", "text": "a car"}
727
+ {"file_name": "train/727.jpg", "text": "a car"}
728
+ {"file_name": "train/728.jpg", "text": "a car"}
729
+ {"file_name": "train/729.jpg", "text": "a car"}
730
+ {"file_name": "train/730.jpg", "text": "a car"}
731
+ {"file_name": "train/731.jpg", "text": "a car"}
732
+ {"file_name": "train/732.jpg", "text": "a car"}
733
+ {"file_name": "train/733.jpg", "text": "a car"}
734
+ {"file_name": "train/734.jpg", "text": "a car"}
735
+ {"file_name": "train/735.jpg", "text": "a car"}
736
+ {"file_name": "train/736.jpg", "text": "a car"}
737
+ {"file_name": "train/737.jpg", "text": "a car"}
738
+ {"file_name": "train/738.jpg", "text": "a car"}
739
+ {"file_name": "train/739.jpg", "text": "a car"}
740
+ {"file_name": "train/740.jpg", "text": "a car"}
741
+ {"file_name": "train/741.jpg", "text": "a car"}
742
+ {"file_name": "train/742.jpg", "text": "a car"}
743
+ {"file_name": "train/743.jpg", "text": "a car"}
744
+ {"file_name": "train/744.jpg", "text": "a car"}
745
+ {"file_name": "train/745.jpg", "text": "a car"}
746
+ {"file_name": "train/746.jpg", "text": "a car"}
747
+ {"file_name": "train/747.jpg", "text": "a car"}
748
+ {"file_name": "train/748.jpg", "text": "a car"}
749
+ {"file_name": "train/749.jpg", "text": "a car"}
750
+ {"file_name": "train/750.jpg", "text": "a car"}
751
+ {"file_name": "train/751.jpg", "text": "a car"}
752
+ {"file_name": "train/752.jpg", "text": "a car"}
753
+ {"file_name": "train/753.jpg", "text": "a car"}
754
+ {"file_name": "train/754.jpg", "text": "a car"}
755
+ {"file_name": "train/755.jpg", "text": "a car"}
756
+ {"file_name": "train/756.jpg", "text": "a car"}
757
+ {"file_name": "train/757.jpg", "text": "a car"}
758
+ {"file_name": "train/758.jpg", "text": "a car"}
759
+ {"file_name": "train/759.jpg", "text": "a car"}
760
+ {"file_name": "train/760.jpg", "text": "a car"}
761
+ {"file_name": "train/761.jpg", "text": "a car"}
762
+ {"file_name": "train/762.jpg", "text": "a car"}
763
+ {"file_name": "train/763.jpg", "text": "a car"}
764
+ {"file_name": "train/764.jpg", "text": "a car"}
765
+ {"file_name": "train/765.jpg", "text": "a car"}
766
+ {"file_name": "train/766.jpg", "text": "a car"}
767
+ {"file_name": "train/767.jpg", "text": "a car"}
768
+ {"file_name": "train/768.jpg", "text": "a car"}
769
+ {"file_name": "train/769.jpg", "text": "a car"}
770
+ {"file_name": "train/770.jpg", "text": "a car"}
771
+ {"file_name": "train/771.jpg", "text": "a car"}
772
+ {"file_name": "train/772.jpg", "text": "a car"}
773
+ {"file_name": "train/773.jpg", "text": "a car"}
774
+ {"file_name": "train/774.jpg", "text": "a car"}
775
+ {"file_name": "train/775.jpg", "text": "a car"}
776
+ {"file_name": "train/776.jpg", "text": "a car"}
777
+ {"file_name": "train/777.jpg", "text": "a car"}
778
+ {"file_name": "train/778.jpg", "text": "a car"}
779
+ {"file_name": "train/779.jpg", "text": "a car"}
780
+ {"file_name": "train/780.jpg", "text": "a car"}
781
+ {"file_name": "train/781.jpg", "text": "a car"}
782
+ {"file_name": "train/782.jpg", "text": "a car"}
783
+ {"file_name": "train/783.jpg", "text": "a car"}
784
+ {"file_name": "train/784.jpg", "text": "a car"}
785
+ {"file_name": "train/785.jpg", "text": "a car"}
786
+ {"file_name": "train/786.jpg", "text": "a car"}
787
+ {"file_name": "train/787.jpg", "text": "a car"}
788
+ {"file_name": "train/788.jpg", "text": "a car"}
789
+ {"file_name": "train/789.jpg", "text": "a car"}
790
+ {"file_name": "train/790.jpg", "text": "a car"}
791
+ {"file_name": "train/791.jpg", "text": "a car"}
792
+ {"file_name": "train/792.jpg", "text": "a car"}
793
+ {"file_name": "train/793.jpg", "text": "a car"}
794
+ {"file_name": "train/794.jpg", "text": "a car"}
795
+ {"file_name": "train/795.jpg", "text": "a car"}
796
+ {"file_name": "train/796.jpg", "text": "a car"}
797
+ {"file_name": "train/797.jpg", "text": "a car"}
798
+ {"file_name": "train/798.jpg", "text": "a car"}
799
+ {"file_name": "train/799.jpg", "text": "a car"}
800
+ {"file_name": "train/800.jpg", "text": "a car"}
801
+ {"file_name": "train/801.jpg", "text": "a car"}
802
+ {"file_name": "train/802.jpg", "text": "a car"}
803
+ {"file_name": "train/803.jpg", "text": "a car"}
804
+ {"file_name": "train/804.jpg", "text": "a car"}
805
+ {"file_name": "train/805.jpg", "text": "a car"}
806
+ {"file_name": "train/806.jpg", "text": "a car"}
807
+ {"file_name": "train/807.jpg", "text": "a car"}
808
+ {"file_name": "train/808.jpg", "text": "a car"}
809
+ {"file_name": "train/809.jpg", "text": "a car"}
810
+ {"file_name": "train/810.jpg", "text": "a car"}
811
+ {"file_name": "train/811.jpg", "text": "a car"}
812
+ {"file_name": "train/812.jpg", "text": "a car"}
813
+ {"file_name": "train/813.jpg", "text": "a car"}
814
+ {"file_name": "train/814.jpg", "text": "a car"}
815
+ {"file_name": "train/815.jpg", "text": "a car"}
816
+ {"file_name": "train/816.jpg", "text": "a car"}
817
+ {"file_name": "train/817.jpg", "text": "a car"}
818
+ {"file_name": "train/818.jpg", "text": "a car"}
819
+ {"file_name": "train/819.jpg", "text": "a car"}
820
+ {"file_name": "train/820.jpg", "text": "a car"}
821
+ {"file_name": "train/821.jpg", "text": "a car"}
822
+ {"file_name": "train/822.jpg", "text": "a car"}
823
+ {"file_name": "train/823.jpg", "text": "a car"}
824
+ {"file_name": "train/824.jpg", "text": "a car"}
825
+ {"file_name": "train/825.jpg", "text": "a car"}
826
+ {"file_name": "train/826.jpg", "text": "a car"}
827
+ {"file_name": "train/827.jpg", "text": "a car"}
828
+ {"file_name": "train/828.jpg", "text": "a car"}
829
+ {"file_name": "train/829.jpg", "text": "a car"}
830
+ {"file_name": "train/830.jpg", "text": "a car"}
831
+ {"file_name": "train/831.jpg", "text": "a car"}
832
+ {"file_name": "train/832.jpg", "text": "a car"}
833
+ {"file_name": "train/833.jpg", "text": "a car"}
834
+ {"file_name": "train/834.jpg", "text": "a car"}
835
+ {"file_name": "train/835.jpg", "text": "a car"}
836
+ {"file_name": "train/836.jpg", "text": "a car"}
837
+ {"file_name": "train/837.jpg", "text": "a car"}
838
+ {"file_name": "train/838.jpg", "text": "a car"}
839
+ {"file_name": "train/839.jpg", "text": "a car"}
840
+ {"file_name": "train/840.jpg", "text": "a car"}
841
+ {"file_name": "train/841.jpg", "text": "a car"}
842
+ {"file_name": "train/842.jpg", "text": "a car"}
843
+ {"file_name": "train/843.jpg", "text": "a car"}
844
+ {"file_name": "train/844.jpg", "text": "a car"}
845
+ {"file_name": "train/845.jpg", "text": "a car"}
846
+ {"file_name": "train/846.jpg", "text": "a car"}
847
+ {"file_name": "train/847.jpg", "text": "a car"}
848
+ {"file_name": "train/848.jpg", "text": "a car"}
849
+ {"file_name": "train/849.jpg", "text": "a car"}
850
+ {"file_name": "train/850.jpg", "text": "a car"}
851
+ {"file_name": "train/851.jpg", "text": "a car"}
852
+ {"file_name": "train/852.jpg", "text": "a car"}
853
+ {"file_name": "train/853.jpg", "text": "a car"}
854
+ {"file_name": "train/854.jpg", "text": "a car"}
855
+ {"file_name": "train/855.jpg", "text": "a car"}
856
+ {"file_name": "train/856.jpg", "text": "a car"}
857
+ {"file_name": "train/857.jpg", "text": "a car"}
858
+ {"file_name": "train/858.jpg", "text": "a car"}
859
+ {"file_name": "train/859.jpg", "text": "a car"}
860
+ {"file_name": "train/860.jpg", "text": "a car"}
861
+ {"file_name": "train/861.jpg", "text": "a car"}
862
+ {"file_name": "train/862.jpg", "text": "a car"}
863
+ {"file_name": "train/863.jpg", "text": "a car"}
864
+ {"file_name": "train/864.jpg", "text": "a car"}
865
+ {"file_name": "train/865.jpg", "text": "a car"}
866
+ {"file_name": "train/866.jpg", "text": "a car"}
867
+ {"file_name": "train/867.jpg", "text": "a car"}
868
+ {"file_name": "train/868.jpg", "text": "a car"}
869
+ {"file_name": "train/869.jpg", "text": "a car"}
870
+ {"file_name": "train/870.jpg", "text": "a car"}
871
+ {"file_name": "train/871.jpg", "text": "a car"}
872
+ {"file_name": "train/872.jpg", "text": "a car"}
873
+ {"file_name": "train/873.jpg", "text": "a car"}
874
+ {"file_name": "train/874.jpg", "text": "a car"}
875
+ {"file_name": "train/875.jpg", "text": "a car"}
876
+ {"file_name": "train/876.jpg", "text": "a car"}
877
+ {"file_name": "train/877.jpg", "text": "a car"}
878
+ {"file_name": "train/878.jpg", "text": "a car"}
879
+ {"file_name": "train/879.jpg", "text": "a car"}
880
+ {"file_name": "train/880.jpg", "text": "a car"}
881
+ {"file_name": "train/881.jpg", "text": "a car"}
882
+ {"file_name": "train/882.jpg", "text": "a car"}
883
+ {"file_name": "train/883.jpg", "text": "a car"}
884
+ {"file_name": "train/884.jpg", "text": "a car"}
885
+ {"file_name": "train/885.jpg", "text": "a car"}
886
+ {"file_name": "train/886.jpg", "text": "a car"}
887
+ {"file_name": "train/887.jpg", "text": "a car"}
888
+ {"file_name": "train/888.jpg", "text": "a car"}
889
+ {"file_name": "train/889.jpg", "text": "a car"}
890
+ {"file_name": "train/890.jpg", "text": "a car"}
891
+ {"file_name": "train/891.jpg", "text": "a car"}
892
+ {"file_name": "train/892.jpg", "text": "a car"}
893
+ {"file_name": "train/893.jpg", "text": "a car"}
894
+ {"file_name": "train/894.jpg", "text": "a car"}
895
+ {"file_name": "train/895.jpg", "text": "a car"}
896
+ {"file_name": "train/896.jpg", "text": "a car"}
897
+ {"file_name": "train/897.jpg", "text": "a car"}
898
+ {"file_name": "train/898.jpg", "text": "a car"}
899
+ {"file_name": "train/899.jpg", "text": "a car"}
900
+ {"file_name": "train/900.jpg", "text": "a car"}
901
+ {"file_name": "train/901.jpg", "text": "a car"}
902
+ {"file_name": "train/902.jpg", "text": "a car"}
903
+ {"file_name": "train/903.jpg", "text": "a car"}
904
+ {"file_name": "train/904.jpg", "text": "a car"}
905
+ {"file_name": "train/905.jpg", "text": "a car"}
906
+ {"file_name": "train/906.jpg", "text": "a car"}
907
+ {"file_name": "train/907.jpg", "text": "a car"}
908
+ {"file_name": "train/908.jpg", "text": "a car"}
909
+ {"file_name": "train/909.jpg", "text": "a car"}
910
+ {"file_name": "train/910.jpg", "text": "a car"}
911
+ {"file_name": "train/911.jpg", "text": "a car"}
912
+ {"file_name": "train/912.jpg", "text": "a car"}
913
+ {"file_name": "train/913.jpg", "text": "a car"}
914
+ {"file_name": "train/914.jpg", "text": "a car"}
915
+ {"file_name": "train/915.jpg", "text": "a car"}
916
+ {"file_name": "train/916.jpg", "text": "a car"}
917
+ {"file_name": "train/917.jpg", "text": "a car"}
918
+ {"file_name": "train/918.jpg", "text": "a car"}
919
+ {"file_name": "train/919.jpg", "text": "a car"}
920
+ {"file_name": "train/920.jpg", "text": "a car"}
921
+ {"file_name": "train/921.jpg", "text": "a car"}
922
+ {"file_name": "train/922.jpg", "text": "a car"}
923
+ {"file_name": "train/923.jpg", "text": "a car"}
924
+ {"file_name": "train/924.jpg", "text": "a car"}
925
+ {"file_name": "train/925.jpg", "text": "a car"}
926
+ {"file_name": "train/926.jpg", "text": "a car"}
927
+ {"file_name": "train/927.jpg", "text": "a car"}
928
+ {"file_name": "train/928.jpg", "text": "a car"}
929
+ {"file_name": "train/929.jpg", "text": "a car"}
930
+ {"file_name": "train/930.jpg", "text": "a car"}
931
+ {"file_name": "train/931.jpg", "text": "a car"}
932
+ {"file_name": "train/932.jpg", "text": "a car"}
933
+ {"file_name": "train/933.jpg", "text": "a car"}
934
+ {"file_name": "train/934.jpg", "text": "a car"}
935
+ {"file_name": "train/935.jpg", "text": "a car"}
936
+ {"file_name": "train/936.jpg", "text": "a car"}
937
+ {"file_name": "train/937.jpg", "text": "a car"}
938
+ {"file_name": "train/938.jpg", "text": "a car"}
939
+ {"file_name": "train/939.jpg", "text": "a car"}
940
+ {"file_name": "train/940.jpg", "text": "a car"}
941
+ {"file_name": "train/941.jpg", "text": "a car"}
942
+ {"file_name": "train/942.jpg", "text": "a car"}
943
+ {"file_name": "train/943.jpg", "text": "a car"}
944
+ {"file_name": "train/944.jpg", "text": "a car"}
945
+ {"file_name": "train/945.jpg", "text": "a car"}
946
+ {"file_name": "train/946.jpg", "text": "a car"}
947
+ {"file_name": "train/947.jpg", "text": "a car"}
948
+ {"file_name": "train/948.jpg", "text": "a car"}
949
+ {"file_name": "train/949.jpg", "text": "a car"}
950
+ {"file_name": "train/950.jpg", "text": "a car"}
951
+ {"file_name": "train/951.jpg", "text": "a car"}
952
+ {"file_name": "train/952.jpg", "text": "a car"}
953
+ {"file_name": "train/953.jpg", "text": "a car"}
954
+ {"file_name": "train/954.jpg", "text": "a car"}
955
+ {"file_name": "train/955.jpg", "text": "a car"}
956
+ {"file_name": "train/956.jpg", "text": "a car"}
957
+ {"file_name": "train/957.jpg", "text": "a car"}
958
+ {"file_name": "train/958.jpg", "text": "a car"}
959
+ {"file_name": "train/959.jpg", "text": "a car"}
960
+ {"file_name": "train/960.jpg", "text": "a car"}
961
+ {"file_name": "train/961.jpg", "text": "a car"}
962
+ {"file_name": "train/962.jpg", "text": "a car"}
963
+ {"file_name": "train/963.jpg", "text": "a car"}
964
+ {"file_name": "train/964.jpg", "text": "a car"}
965
+ {"file_name": "train/965.jpg", "text": "a car"}
966
+ {"file_name": "train/966.jpg", "text": "a car"}
967
+ {"file_name": "train/967.jpg", "text": "a car"}
968
+ {"file_name": "train/968.jpg", "text": "a car"}
969
+ {"file_name": "train/969.jpg", "text": "a car"}
970
+ {"file_name": "train/970.jpg", "text": "a car"}
971
+ {"file_name": "train/971.jpg", "text": "a car"}
972
+ {"file_name": "train/972.jpg", "text": "a car"}
973
+ {"file_name": "train/973.jpg", "text": "a car"}
974
+ {"file_name": "train/974.jpg", "text": "a car"}
975
+ {"file_name": "train/975.jpg", "text": "a car"}
976
+ {"file_name": "train/976.jpg", "text": "a car"}
977
+ {"file_name": "train/977.jpg", "text": "a car"}
978
+ {"file_name": "train/978.jpg", "text": "a car"}
979
+ {"file_name": "train/979.jpg", "text": "a car"}
980
+ {"file_name": "train/980.jpg", "text": "a car"}
981
+ {"file_name": "train/981.jpg", "text": "a car"}
982
+ {"file_name": "train/982.jpg", "text": "a car"}
983
+ {"file_name": "train/983.jpg", "text": "a car"}
984
+ {"file_name": "train/984.jpg", "text": "a car"}
985
+ {"file_name": "train/985.jpg", "text": "a car"}
986
+ {"file_name": "train/986.jpg", "text": "a car"}
987
+ {"file_name": "train/987.jpg", "text": "a car"}
988
+ {"file_name": "train/988.jpg", "text": "a car"}
989
+ {"file_name": "train/989.jpg", "text": "a car"}
990
+ {"file_name": "train/990.jpg", "text": "a car"}
991
+ {"file_name": "train/991.jpg", "text": "a car"}
992
+ {"file_name": "train/992.jpg", "text": "a car"}
993
+ {"file_name": "train/993.jpg", "text": "a car"}
994
+ {"file_name": "train/994.jpg", "text": "a car"}
995
+ {"file_name": "train/995.jpg", "text": "a car"}
996
+ {"file_name": "train/996.jpg", "text": "a car"}
997
+ {"file_name": "train/997.jpg", "text": "a car"}
998
+ {"file_name": "train/998.jpg", "text": "a car"}
999
+ {"file_name": "train/999.jpg", "text": "a car"}
1000
+ {"file_name": "train/1000.jpg", "text": "a car"}
Gradient_ascent_traininig_scripts/data/car/train/fix.py ADDED
@@ -0,0 +1,16 @@
+ import json
+ 
+ # Define the range and the common text description
+ start, end = 1, 1000
+ description = "a car"
+ 
+ # Open the metadata.jsonl file to write the JSON data
+ with open("metadata.jsonl", "w") as file:
+     # Iterate through the range and format each entry
+     for i in range(start, end + 1):
+         entry = {
+             "file_name": f"train/{i}.jpg",
+             "text": description
+         }
+         # Write each entry as a JSON line
+         file.write(json.dumps(entry) + "\n")
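Aside: a dataset laid out this way (a train/ folder of images plus metadata.jsonl captions) matches what the Hugging Face "imagefolder" builder expects. A minimal loading sketch, assuming the datasets library is installed and data/car uses the layout above:

    from datasets import load_dataset

    # "imagefolder" pairs each train/*.jpg with its caption from metadata.jsonl,
    # exposing "image" and "text" columns.
    dataset = load_dataset("imagefolder", data_dir="./data/car", split="train")
    print(dataset[0]["text"])  # "a car"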
Gradient_ascent_traininig_scripts/generate_images.sh ADDED
@@ -0,0 +1,75 @@
+ # OUTPUT_DIR="./data/english_springer_ti"
+ # PROMPT="a photo of an english springer"
+ # NUM_TRAIN_IMAGES=100
+ 
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode train \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # OUTPUT_DIR="./data/garbage_truck_ti"
+ # PROMPT="a photo of a garbage truck"
+ # NUM_TRAIN_IMAGES=100
+ 
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode train \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # OUTPUT_DIR="./data/kilian_eng_ti"
+ # PROMPT="a painting in the style of Kilian Eng"
+ # NUM_TRAIN_IMAGES=100
+ 
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode train \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # OUTPUT_DIR="./data/thomas_kinkade_ti"
+ # PROMPT="a painting in the style of Thomas Kinkade"
+ # NUM_TRAIN_IMAGES=100
+ 
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode train \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # OUTPUT_DIR="./data/van_gogh_ti"
+ # PROMPT="a painting in the style of Van Gogh"
+ # NUM_TRAIN_IMAGES=100
+ 
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode train \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ OUTPUT_DIR="./generation/english_springer_erasure"
+ PROMPT="a photo of an english springer spaniel"
+ NUM_TRAIN_IMAGES=100
+ 
+ python3 generate_training_images.py \
+     --output_dir $OUTPUT_DIR \
+     --prompt "$PROMPT" \
+     --mode train \
+     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # PROMPT="a photo of a golden retriever"
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode test \
+ #     --model_path "./checkpoint/english_springer_erasure" \
+ #     --num_train_images $NUM_TRAIN_IMAGES
+ 
+ # PROMPT="a photo of a american pit bull terrier"
+ # python3 generate_training_images.py \
+ #     --output_dir $OUTPUT_DIR \
+ #     --prompt "$PROMPT" \
+ #     --mode test \
+ #     --model_path "./checkpoint/english_springer_erasure" \
+ #     --num_train_images $NUM_TRAIN_IMAGES
Gradient_ascent_traininig_scripts/generate_training_images.py ADDED
@@ -0,0 +1,75 @@
+ from diffusers import StableDiffusionPipeline
+ import torch
+ import os
+ import json
+ import argparse
+ 
+ def parse_args():
+     parser = argparse.ArgumentParser(description="Generate training or test images with Stable Diffusion")
+ 
+     parser.add_argument("--output_dir", type=str, help="Output directory")
+     parser.add_argument("--model_path", type=str, help="Path to model checkpoint", default="CompVis/stable-diffusion-v1-4")
+     parser.add_argument("--seed", type=int, help="Seed for random number generator (currently unused)", default=0)
+     parser.add_argument("--prompt", type=str, help="Prompt for image generation")
+     parser.add_argument("--mode", type=str, help="Mode for image generation", choices=["train", "test"], default="train")
+     parser.add_argument("--num_train_images", type=int, help="Number of images to generate", default=1000)
+     args = parser.parse_args()
+     return args
+ 
+ if __name__ == "__main__":
+     args = parse_args()
+     device = 'cuda' if torch.cuda.is_available() else 'cpu'
+ 
+     if args.mode == "test":
+         os.makedirs(args.output_dir, exist_ok=True)
+ 
+         pipe = StableDiffusionPipeline.from_pretrained(args.model_path, safety_checker=None, torch_dtype=torch.float16).to(device)
+ 
+         for i in range(args.num_train_images):
+             # Regenerate until the output is not flagged NSFW. Note: with
+             # safety_checker=None, nsfw_content_detected is None, so this
+             # check only takes effect when a safety checker is loaded.
+             while True:
+                 output = pipe(prompt=args.prompt)
+                 image = output.images[0]
+                 nsfw = output.nsfw_content_detected
+                 # nsfw may be a list with one flag per image
+                 if isinstance(nsfw, list):
+                     nsfw = nsfw[0]
+                 if not nsfw:
+                     break
+             image.save(os.path.join(args.output_dir, f"{args.prompt}_{i}.png"))
+ 
+     elif args.mode == "train":
+         metadata = []
+ 
+         os.makedirs(args.output_dir, exist_ok=True)
+         os.makedirs(os.path.join(args.output_dir, "train"), exist_ok=True)
+ 
+         pipe = StableDiffusionPipeline.from_pretrained(args.model_path, safety_checker=None, torch_dtype=torch.float16).to(device)
+ 
+         for i in range(args.num_train_images):
+             while True:
+                 output = pipe(prompt=args.prompt)
+                 image = output.images[0]
+                 nsfw = output.nsfw_content_detected
+                 if isinstance(nsfw, list):
+                     nsfw = nsfw[0]
+                 if not nsfw:
+                     break
+             image.save(os.path.join(args.output_dir, "train", f"{args.prompt}_{i}.png"))
+ 
+             metadata.append({"file_name": f"train/{args.prompt}_{i}.png", "text": args.prompt})
+ 
+         with open(os.path.join(args.output_dir, "metadata.jsonl"), "w") as f:
+             for m in metadata:
+                 f.write(json.dumps(m) + "\n")
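Note that the script above parses --seed but never applies it. A minimal sketch of how the seed could be wired through for reproducible generations, assuming diffusers pipelines accept a torch.Generator (variable names mirror the script):

    import torch

    # A seeded generator makes each pipeline call deterministic for a fixed seed.
    generator = torch.Generator(device=device).manual_seed(args.seed)
    output = pipe(prompt=args.prompt, generator=generator)
    image = output.images[0]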
Gradient_ascent_traininig_scripts/generation/english_springer_erasure/metadata.jsonl ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"file_name": "train/a photo of an english springer spaniel_0.png", "text": "a photo of an english springer spaniel"}
2
+ {"file_name": "train/a photo of an english springer spaniel_1.png", "text": "a photo of an english springer spaniel"}
3
+ {"file_name": "train/a photo of an english springer spaniel_2.png", "text": "a photo of an english springer spaniel"}
4
+ {"file_name": "train/a photo of an english springer spaniel_3.png", "text": "a photo of an english springer spaniel"}
5
+ {"file_name": "train/a photo of an english springer spaniel_4.png", "text": "a photo of an english springer spaniel"}
6
+ {"file_name": "train/a photo of an english springer spaniel_5.png", "text": "a photo of an english springer spaniel"}
7
+ {"file_name": "train/a photo of an english springer spaniel_6.png", "text": "a photo of an english springer spaniel"}
8
+ {"file_name": "train/a photo of an english springer spaniel_7.png", "text": "a photo of an english springer spaniel"}
9
+ {"file_name": "train/a photo of an english springer spaniel_8.png", "text": "a photo of an english springer spaniel"}
10
+ {"file_name": "train/a photo of an english springer spaniel_9.png", "text": "a photo of an english springer spaniel"}
11
+ {"file_name": "train/a photo of an english springer spaniel_10.png", "text": "a photo of an english springer spaniel"}
12
+ {"file_name": "train/a photo of an english springer spaniel_11.png", "text": "a photo of an english springer spaniel"}
13
+ {"file_name": "train/a photo of an english springer spaniel_12.png", "text": "a photo of an english springer spaniel"}
14
+ {"file_name": "train/a photo of an english springer spaniel_13.png", "text": "a photo of an english springer spaniel"}
15
+ {"file_name": "train/a photo of an english springer spaniel_14.png", "text": "a photo of an english springer spaniel"}
16
+ {"file_name": "train/a photo of an english springer spaniel_15.png", "text": "a photo of an english springer spaniel"}
17
+ {"file_name": "train/a photo of an english springer spaniel_16.png", "text": "a photo of an english springer spaniel"}
18
+ {"file_name": "train/a photo of an english springer spaniel_17.png", "text": "a photo of an english springer spaniel"}
19
+ {"file_name": "train/a photo of an english springer spaniel_18.png", "text": "a photo of an english springer spaniel"}
20
+ {"file_name": "train/a photo of an english springer spaniel_19.png", "text": "a photo of an english springer spaniel"}
21
+ {"file_name": "train/a photo of an english springer spaniel_20.png", "text": "a photo of an english springer spaniel"}
22
+ {"file_name": "train/a photo of an english springer spaniel_21.png", "text": "a photo of an english springer spaniel"}
23
+ {"file_name": "train/a photo of an english springer spaniel_22.png", "text": "a photo of an english springer spaniel"}
24
+ {"file_name": "train/a photo of an english springer spaniel_23.png", "text": "a photo of an english springer spaniel"}
25
+ {"file_name": "train/a photo of an english springer spaniel_24.png", "text": "a photo of an english springer spaniel"}
26
+ {"file_name": "train/a photo of an english springer spaniel_25.png", "text": "a photo of an english springer spaniel"}
27
+ {"file_name": "train/a photo of an english springer spaniel_26.png", "text": "a photo of an english springer spaniel"}
28
+ {"file_name": "train/a photo of an english springer spaniel_27.png", "text": "a photo of an english springer spaniel"}
29
+ {"file_name": "train/a photo of an english springer spaniel_28.png", "text": "a photo of an english springer spaniel"}
30
+ {"file_name": "train/a photo of an english springer spaniel_29.png", "text": "a photo of an english springer spaniel"}
31
+ {"file_name": "train/a photo of an english springer spaniel_30.png", "text": "a photo of an english springer spaniel"}
32
+ {"file_name": "train/a photo of an english springer spaniel_31.png", "text": "a photo of an english springer spaniel"}
33
+ {"file_name": "train/a photo of an english springer spaniel_32.png", "text": "a photo of an english springer spaniel"}
34
+ {"file_name": "train/a photo of an english springer spaniel_33.png", "text": "a photo of an english springer spaniel"}
35
+ {"file_name": "train/a photo of an english springer spaniel_34.png", "text": "a photo of an english springer spaniel"}
36
+ {"file_name": "train/a photo of an english springer spaniel_35.png", "text": "a photo of an english springer spaniel"}
37
+ {"file_name": "train/a photo of an english springer spaniel_36.png", "text": "a photo of an english springer spaniel"}
38
+ {"file_name": "train/a photo of an english springer spaniel_37.png", "text": "a photo of an english springer spaniel"}
39
+ {"file_name": "train/a photo of an english springer spaniel_38.png", "text": "a photo of an english springer spaniel"}
40
+ {"file_name": "train/a photo of an english springer spaniel_39.png", "text": "a photo of an english springer spaniel"}
41
+ {"file_name": "train/a photo of an english springer spaniel_40.png", "text": "a photo of an english springer spaniel"}
42
+ {"file_name": "train/a photo of an english springer spaniel_41.png", "text": "a photo of an english springer spaniel"}
43
+ {"file_name": "train/a photo of an english springer spaniel_42.png", "text": "a photo of an english springer spaniel"}
44
+ {"file_name": "train/a photo of an english springer spaniel_43.png", "text": "a photo of an english springer spaniel"}
45
+ {"file_name": "train/a photo of an english springer spaniel_44.png", "text": "a photo of an english springer spaniel"}
46
+ {"file_name": "train/a photo of an english springer spaniel_45.png", "text": "a photo of an english springer spaniel"}
47
+ {"file_name": "train/a photo of an english springer spaniel_46.png", "text": "a photo of an english springer spaniel"}
48
+ {"file_name": "train/a photo of an english springer spaniel_47.png", "text": "a photo of an english springer spaniel"}
49
+ {"file_name": "train/a photo of an english springer spaniel_48.png", "text": "a photo of an english springer spaniel"}
50
+ {"file_name": "train/a photo of an english springer spaniel_49.png", "text": "a photo of an english springer spaniel"}
51
+ {"file_name": "train/a photo of an english springer spaniel_50.png", "text": "a photo of an english springer spaniel"}
52
+ {"file_name": "train/a photo of an english springer spaniel_51.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_52.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_53.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_54.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_55.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_56.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_57.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_58.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_59.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_60.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_61.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_62.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_63.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_64.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_65.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_66.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_67.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_68.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_69.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_70.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_71.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_72.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_73.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_74.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_75.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_76.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_77.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_78.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_79.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_80.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_81.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_82.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_83.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_84.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_85.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_86.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_87.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_88.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_89.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_90.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_91.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_92.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_93.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_94.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_95.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_96.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_97.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_98.png", "text": "a photo of an english springer spaniel"}
+ {"file_name": "train/a photo of an english springer spaniel_99.png", "text": "a photo of an english springer spaniel"}
Gradient_ascent_traininig_scripts/inversion.sh ADDED
@@ -0,0 +1,60 @@
+ export MODEL_NAME="./checkpoint/van_gogh_erasure"
+ export DATA_DIR="./data/van_gogh_ti/train"
+
+ accelerate launch textual_inversion.py \
+ --pretrained_model_name_or_path=$MODEL_NAME \
+ --train_data_dir=$DATA_DIR \
+ --learnable_property="style" \
+ --placeholder_token="<art-style>" \
+ --initializer_token="art" \
+ --resolution=512 \
+ --train_batch_size=1 \
+ --gradient_accumulation_steps=4 \
+ --max_train_steps=5000 \
+ --learning_rate=5.0e-04 \
+ --scale_lr \
+ --lr_scheduler="constant" \
+ --lr_warmup_steps=0 \
+ --push_to_hub \
+ --output_dir="./checkpoint/van_gogh_inversion"
+
+ export MODEL_NAME="./checkpoint/kilian_eng_erasure"
+ export DATA_DIR="./data/kilian_eng_ti/train"
+
+ accelerate launch textual_inversion.py \
+ --pretrained_model_name_or_path=$MODEL_NAME \
+ --train_data_dir=$DATA_DIR \
+ --learnable_property="style" \
+ --placeholder_token="<art-style>" \
+ --initializer_token="art" \
+ --resolution=512 \
+ --train_batch_size=1 \
+ --gradient_accumulation_steps=4 \
+ --max_train_steps=5000 \
+ --learning_rate=5.0e-04 \
+ --scale_lr \
+ --lr_scheduler="constant" \
+ --lr_warmup_steps=0 \
+ --push_to_hub \
+ --output_dir="./checkpoint/kilian_eng_inversion"
+
+ export MODEL_NAME="./checkpoint/thomas_kinkade_erasure"
+ export DATA_DIR="./data/thomas_kinkade_ti/train"
+
+ accelerate launch textual_inversion.py \
+ --pretrained_model_name_or_path=$MODEL_NAME \
+ --train_data_dir=$DATA_DIR \
+ --learnable_property="style" \
+ --placeholder_token="<art-style>" \
+ --initializer_token="art" \
+ --resolution=512 \
+ --train_batch_size=1 \
+ --gradient_accumulation_steps=4 \
+ --max_train_steps=5000 \
+ --learning_rate=5.0e-04 \
+ --scale_lr \
+ --lr_scheduler="constant" \
+ --lr_warmup_steps=0 \
+ --push_to_hub \
+ --output_dir="./checkpoint/thomas_kinkade_inversion"
+
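Each `inversion.sh` run re-learns an erased style as a fresh `<art-style>` token on top of the corresponding erasure checkpoint. A sketch of how the resulting embedding could be loaded to check whether the erased style resurfaces — paths mirror the script, the weight file name assumes the default safetensors output of `textual_inversion.py`, and a CUDA device is assumed:

```python
import torch
from diffusers import StableDiffusionPipeline

# Probe an erased checkpoint with its learned inversion token.
pipe = StableDiffusionPipeline.from_pretrained(
    "./checkpoint/van_gogh_erasure", torch_dtype=torch.float16, safety_checker=None
).to("cuda")
pipe.load_textual_inversion(
    "./checkpoint/van_gogh_inversion/learned_embeds.safetensors", token="<art-style>"
)
image = pipe("a painting of a wheat field in the style of <art-style>").images[0]
image.save("inversion_probe.png")
```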
Gradient_ascent_traininig_scripts/textual_inversion.py ADDED
@@ -0,0 +1,1022 @@
1
+ #!/usr/bin/env python
2
+ # coding=utf-8
3
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
4
+ #
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
16
+ import argparse
17
+ import logging
18
+ import math
19
+ import os
20
+ import random
21
+ import shutil
22
+ import warnings
23
+ from contextlib import nullcontext
24
+ from pathlib import Path
25
+
26
+ import numpy as np
27
+ import PIL
28
+ import safetensors
29
+ import torch
30
+ import torch.nn.functional as F
31
+ import torch.utils.checkpoint
32
+ import transformers
33
+ from accelerate import Accelerator
34
+ from accelerate.logging import get_logger
35
+ from accelerate.utils import ProjectConfiguration, set_seed
36
+ from huggingface_hub import create_repo, upload_folder
37
+
38
+ # TODO: remove and import from diffusers.utils when the new version of diffusers is released
39
+ from packaging import version
40
+ from PIL import Image
41
+ from torch.utils.data import Dataset
42
+ from torchvision import transforms
43
+ from tqdm.auto import tqdm
44
+ from transformers import CLIPTextModel, CLIPTokenizer
45
+
46
+ import diffusers
47
+ from diffusers import (
48
+ AutoencoderKL,
49
+ DDPMScheduler,
50
+ DiffusionPipeline,
51
+ DPMSolverMultistepScheduler,
52
+ StableDiffusionPipeline,
53
+ UNet2DConditionModel,
54
+ )
55
+ from diffusers.optimization import get_scheduler
56
+ from diffusers.utils import check_min_version, is_wandb_available
57
+ from diffusers.utils.hub_utils import load_or_create_model_card, populate_model_card
58
+ from diffusers.utils.import_utils import is_xformers_available
59
+
60
+
61
+ if is_wandb_available():
62
+ import wandb
63
+
64
+ if version.parse(version.parse(PIL.__version__).base_version) >= version.parse("9.1.0"):
65
+ PIL_INTERPOLATION = {
66
+ "linear": PIL.Image.Resampling.BILINEAR,
67
+ "bilinear": PIL.Image.Resampling.BILINEAR,
68
+ "bicubic": PIL.Image.Resampling.BICUBIC,
69
+ "lanczos": PIL.Image.Resampling.LANCZOS,
70
+ "nearest": PIL.Image.Resampling.NEAREST,
71
+ }
72
+ else:
73
+ PIL_INTERPOLATION = {
74
+ "linear": PIL.Image.LINEAR,
75
+ "bilinear": PIL.Image.BILINEAR,
76
+ "bicubic": PIL.Image.BICUBIC,
77
+ "lanczos": PIL.Image.LANCZOS,
78
+ "nearest": PIL.Image.NEAREST,
79
+ }
80
+ # ------------------------------------------------------------------------------
81
+
82
+
83
+ # Will error if the minimal version of diffusers is not installed. Remove at your own risks.
84
+ check_min_version("0.31.0.dev0")
85
+
86
+ logger = get_logger(__name__)
87
+
88
+
89
+ def save_model_card(repo_id: str, images: list = None, base_model: str = None, repo_folder: str = None):
90
+ img_str = ""
91
+ if images is not None:
92
+ for i, image in enumerate(images):
93
+ image.save(os.path.join(repo_folder, f"image_{i}.png"))
94
+ img_str += f"![img_{i}](./image_{i}.png)\n"
95
+ model_description = f"""
96
+ # Textual inversion text2image fine-tuning - {repo_id}
97
+ These are textual inversion adaptation weights for {base_model}. You can find some example images below. \n
98
+ {img_str}
99
+ """
100
+ model_card = load_or_create_model_card(
101
+ repo_id_or_path=repo_id,
102
+ from_training=True,
103
+ license="creativeml-openrail-m",
104
+ base_model=base_model,
105
+ model_description=model_description,
106
+ inference=True,
107
+ )
108
+
109
+ tags = [
110
+ "stable-diffusion",
111
+ "stable-diffusion-diffusers",
112
+ "text-to-image",
113
+ "diffusers",
114
+ "textual_inversion",
115
+ "diffusers-training",
116
+ ]
117
+ model_card = populate_model_card(model_card, tags=tags)
118
+
119
+ model_card.save(os.path.join(repo_folder, "README.md"))
120
+
121
+
122
+ def log_validation(text_encoder, tokenizer, unet, vae, args, accelerator, weight_dtype, epoch):
123
+ logger.info(
124
+ f"Running validation... \n Generating {args.num_validation_images} images with prompt:"
125
+ f" {args.validation_prompt}."
126
+ )
127
+ # create pipeline (note: unet and vae are loaded again in float32)
128
+ pipeline = DiffusionPipeline.from_pretrained(
129
+ args.pretrained_model_name_or_path,
130
+ text_encoder=accelerator.unwrap_model(text_encoder),
131
+ tokenizer=tokenizer,
132
+ unet=unet,
133
+ vae=vae,
134
+ safety_checker=None,
135
+ revision=args.revision,
136
+ variant=args.variant,
137
+ torch_dtype=weight_dtype,
138
+ )
139
+ pipeline.scheduler = DPMSolverMultistepScheduler.from_config(pipeline.scheduler.config)
140
+ pipeline = pipeline.to(accelerator.device)
141
+ pipeline.set_progress_bar_config(disable=True)
142
+
143
+ # run inference
144
+ generator = None if args.seed is None else torch.Generator(device=accelerator.device).manual_seed(args.seed)
145
+ images = []
146
+ for _ in range(args.num_validation_images):
147
+ if torch.backends.mps.is_available():
148
+ autocast_ctx = nullcontext()
149
+ else:
150
+ autocast_ctx = torch.autocast(accelerator.device.type)
151
+
152
+ with autocast_ctx:
153
+ image = pipeline(args.validation_prompt, num_inference_steps=25, generator=generator).images[0]
154
+ images.append(image)
155
+
156
+ for tracker in accelerator.trackers:
157
+ if tracker.name == "tensorboard":
158
+ np_images = np.stack([np.asarray(img) for img in images])
159
+ tracker.writer.add_images("validation", np_images, epoch, dataformats="NHWC")
160
+ if tracker.name == "wandb":
161
+ tracker.log(
162
+ {
163
+ "validation": [
164
+ wandb.Image(image, caption=f"{i}: {args.validation_prompt}") for i, image in enumerate(images)
165
+ ]
166
+ }
167
+ )
168
+
169
+ del pipeline
170
+ torch.cuda.empty_cache()
171
+ return images
172
+
173
+
174
+ def save_progress(text_encoder, placeholder_token_ids, accelerator, args, save_path, safe_serialization=True):
175
+ logger.info("Saving embeddings")
176
+ learned_embeds = (
177
+ accelerator.unwrap_model(text_encoder)
178
+ .get_input_embeddings()
179
+ .weight[min(placeholder_token_ids) : max(placeholder_token_ids) + 1]
180
+ )
181
+ learned_embeds_dict = {args.placeholder_token: learned_embeds.detach().cpu()}
182
+
183
+ if safe_serialization:
184
+ safetensors.torch.save_file(learned_embeds_dict, save_path, metadata={"format": "pt"})
185
+ else:
186
+ torch.save(learned_embeds_dict, save_path)
187
+
188
+
189
+ def parse_args():
190
+ parser = argparse.ArgumentParser(description="Simple example of a training script.")
191
+ parser.add_argument(
192
+ "--save_steps",
193
+ type=int,
194
+ default=500,
195
+ help="Save learned_embeds.bin every X updates steps.",
196
+ )
197
+ parser.add_argument(
198
+ "--save_as_full_pipeline",
199
+ action="store_true",
200
+ help="Save the complete stable diffusion pipeline.",
201
+ )
202
+ parser.add_argument(
203
+ "--num_vectors",
204
+ type=int,
205
+ default=1,
206
+ help="How many textual inversion vectors shall be used to learn the concept.",
207
+ )
208
+ parser.add_argument(
209
+ "--pretrained_model_name_or_path",
210
+ type=str,
211
+ default=None,
212
+ required=True,
213
+ help="Path to pretrained model or model identifier from huggingface.co/models.",
214
+ )
215
+ parser.add_argument(
216
+ "--revision",
217
+ type=str,
218
+ default=None,
219
+ required=False,
220
+ help="Revision of pretrained model identifier from huggingface.co/models.",
221
+ )
222
+ parser.add_argument(
223
+ "--variant",
224
+ type=str,
225
+ default=None,
226
+ help="Variant of the model files of the pretrained model identifier from huggingface.co/models, 'e.g.' fp16",
227
+ )
228
+ parser.add_argument(
229
+ "--tokenizer_name",
230
+ type=str,
231
+ default=None,
232
+ help="Pretrained tokenizer name or path if not the same as model_name",
233
+ )
234
+ parser.add_argument(
235
+ "--train_data_dir", type=str, default=None, required=True, help="A folder containing the training data."
236
+ )
237
+ parser.add_argument(
238
+ "--placeholder_token",
239
+ type=str,
240
+ default=None,
241
+ required=True,
242
+ help="A token to use as a placeholder for the concept.",
243
+ )
244
+ parser.add_argument(
245
+ "--initializer_token", type=str, default=None, required=True, help="A token to use as initializer word."
246
+ )
247
+ parser.add_argument("--learnable_property", type=str, default="object", help="Choose between 'object' and 'style'")
248
+ parser.add_argument("--repeats", type=int, default=100, help="How many times to repeat the training data.")
249
+ parser.add_argument(
250
+ "--output_dir",
251
+ type=str,
252
+ default="text-inversion-model",
253
+ help="The output directory where the model predictions and checkpoints will be written.",
254
+ )
255
+ parser.add_argument("--seed", type=int, default=None, help="A seed for reproducible training.")
256
+ parser.add_argument(
257
+ "--resolution",
258
+ type=int,
259
+ default=512,
260
+ help=(
261
+ "The resolution for input images, all the images in the train/validation dataset will be resized to this"
262
+ " resolution"
263
+ ),
264
+ )
265
+ parser.add_argument(
266
+ "--center_crop", action="store_true", help="Whether to center crop images before resizing to resolution."
267
+ )
268
+ parser.add_argument(
269
+ "--train_batch_size", type=int, default=16, help="Batch size (per device) for the training dataloader."
270
+ )
271
+ parser.add_argument("--num_train_epochs", type=int, default=100)
272
+ parser.add_argument(
273
+ "--max_train_steps",
274
+ type=int,
275
+ default=5000,
276
+ help="Total number of training steps to perform. If provided, overrides num_train_epochs.",
277
+ )
278
+ parser.add_argument(
279
+ "--gradient_accumulation_steps",
280
+ type=int,
281
+ default=1,
282
+ help="Number of updates steps to accumulate before performing a backward/update pass.",
283
+ )
284
+ parser.add_argument(
285
+ "--gradient_checkpointing",
286
+ action="store_true",
287
+ help="Whether or not to use gradient checkpointing to save memory at the expense of slower backward pass.",
288
+ )
289
+ parser.add_argument(
290
+ "--learning_rate",
291
+ type=float,
292
+ default=1e-4,
293
+ help="Initial learning rate (after the potential warmup period) to use.",
294
+ )
295
+ parser.add_argument(
296
+ "--scale_lr",
297
+ action="store_true",
298
+ default=False,
299
+ help="Scale the learning rate by the number of GPUs, gradient accumulation steps, and batch size.",
300
+ )
301
+ parser.add_argument(
302
+ "--lr_scheduler",
303
+ type=str,
304
+ default="constant",
305
+ help=(
306
+ 'The scheduler type to use. Choose between ["linear", "cosine", "cosine_with_restarts", "polynomial",'
307
+ ' "constant", "constant_with_warmup"]'
308
+ ),
309
+ )
310
+ parser.add_argument(
311
+ "--lr_warmup_steps", type=int, default=500, help="Number of steps for the warmup in the lr scheduler."
312
+ )
313
+ parser.add_argument(
314
+ "--lr_num_cycles",
315
+ type=int,
316
+ default=1,
317
+ help="Number of hard resets of the lr in cosine_with_restarts scheduler.",
318
+ )
319
+ parser.add_argument(
320
+ "--dataloader_num_workers",
321
+ type=int,
322
+ default=0,
323
+ help=(
324
+ "Number of subprocesses to use for data loading. 0 means that the data will be loaded in the main process."
325
+ ),
326
+ )
327
+ parser.add_argument("--adam_beta1", type=float, default=0.9, help="The beta1 parameter for the Adam optimizer.")
328
+ parser.add_argument("--adam_beta2", type=float, default=0.999, help="The beta2 parameter for the Adam optimizer.")
329
+ parser.add_argument("--adam_weight_decay", type=float, default=1e-2, help="Weight decay to use.")
330
+ parser.add_argument("--adam_epsilon", type=float, default=1e-08, help="Epsilon value for the Adam optimizer")
331
+ parser.add_argument("--push_to_hub", action="store_true", help="Whether or not to push the model to the Hub.")
332
+ parser.add_argument("--hub_token", type=str, default=None, help="The token to use to push to the Model Hub.")
333
+ parser.add_argument(
334
+ "--hub_model_id",
335
+ type=str,
336
+ default=None,
337
+ help="The name of the repository to keep in sync with the local `output_dir`.",
338
+ )
339
+ parser.add_argument(
340
+ "--logging_dir",
341
+ type=str,
342
+ default="logs",
343
+ help=(
344
+ "[TensorBoard](https://www.tensorflow.org/tensorboard) log directory. Will default to"
345
+ " *output_dir/runs/**CURRENT_DATETIME_HOSTNAME***."
346
+ ),
347
+ )
348
+ parser.add_argument(
349
+ "--mixed_precision",
350
+ type=str,
351
+ default="no",
352
+ choices=["no", "fp16", "bf16"],
353
+ help=(
354
+ "Whether to use mixed precision. Choose"
355
+ "between fp16 and bf16 (bfloat16). Bf16 requires PyTorch >= 1.10."
356
+ "and Nvidia Ampere GPU or Intel Gen 4 Xeon (and later) ."
357
+ ),
358
+ )
359
+ parser.add_argument(
360
+ "--allow_tf32",
361
+ action="store_true",
362
+ help=(
363
+ "Whether or not to allow TF32 on Ampere GPUs. Can be used to speed up training. For more information, see"
364
+ " https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices"
365
+ ),
366
+ )
367
+ parser.add_argument(
368
+ "--report_to",
369
+ type=str,
370
+ default="tensorboard",
371
+ help=(
372
+ 'The integration to report the results and logs to. Supported platforms are `"tensorboard"`'
373
+ ' (default), `"wandb"` and `"comet_ml"`. Use `"all"` to report to all integrations.'
374
+ ),
375
+ )
376
+ parser.add_argument(
377
+ "--validation_prompt",
378
+ type=str,
379
+ default=None,
380
+ help="A prompt that is used during validation to verify that the model is learning.",
381
+ )
382
+ parser.add_argument(
383
+ "--num_validation_images",
384
+ type=int,
385
+ default=4,
386
+ help="Number of images that should be generated during validation with `validation_prompt`.",
387
+ )
388
+ parser.add_argument(
389
+ "--validation_steps",
390
+ type=int,
391
+ default=100,
392
+ help=(
393
+ "Run validation every X steps. Validation consists of running the prompt"
394
+ " `args.validation_prompt` multiple times: `args.num_validation_images`"
395
+ " and logging the images."
396
+ ),
397
+ )
398
+ parser.add_argument(
399
+ "--validation_epochs",
400
+ type=int,
401
+ default=None,
402
+ help=(
403
+ "Deprecated in favor of validation_steps. Run validation every X epochs. Validation consists of running the prompt"
404
+ " `args.validation_prompt` multiple times: `args.num_validation_images`"
405
+ " and logging the images."
406
+ ),
407
+ )
408
+ parser.add_argument("--local_rank", type=int, default=-1, help="For distributed training: local_rank")
409
+ parser.add_argument(
410
+ "--checkpointing_steps",
411
+ type=int,
412
+ default=500,
413
+ help=(
414
+ "Save a checkpoint of the training state every X updates. These checkpoints are only suitable for resuming"
415
+ " training using `--resume_from_checkpoint`."
416
+ ),
417
+ )
418
+ parser.add_argument(
419
+ "--checkpoints_total_limit",
420
+ type=int,
421
+ default=None,
422
+ help=("Max number of checkpoints to store."),
423
+ )
424
+ parser.add_argument(
425
+ "--resume_from_checkpoint",
426
+ type=str,
427
+ default=None,
428
+ help=(
429
+ "Whether training should be resumed from a previous checkpoint. Use a path saved by"
430
+ ' `--checkpointing_steps`, or `"latest"` to automatically select the last available checkpoint.'
431
+ ),
432
+ )
433
+ parser.add_argument(
434
+ "--enable_xformers_memory_efficient_attention", action="store_true", help="Whether or not to use xformers."
435
+ )
436
+ parser.add_argument(
437
+ "--no_safe_serialization",
438
+ action="store_true",
439
+ help="If specified save the checkpoint not in `safetensors` format, but in original PyTorch format instead.",
440
+ )
441
+
442
+ args = parser.parse_args()
443
+ env_local_rank = int(os.environ.get("LOCAL_RANK", -1))
444
+ if env_local_rank != -1 and env_local_rank != args.local_rank:
445
+ args.local_rank = env_local_rank
446
+
447
+ if args.train_data_dir is None:
448
+ raise ValueError("You must specify a train data directory.")
449
+
450
+ return args
451
+
452
+
453
+ imagenet_templates_small = [
454
+ "a photo of a {}",
455
+ "a rendering of a {}",
456
+ "a cropped photo of the {}",
457
+ "the photo of a {}",
458
+ "a photo of a clean {}",
459
+ "a photo of a dirty {}",
460
+ "a dark photo of the {}",
461
+ "a photo of my {}",
462
+ "a photo of the cool {}",
463
+ "a close-up photo of a {}",
464
+ "a bright photo of the {}",
465
+ "a cropped photo of a {}",
466
+ "a photo of the {}",
467
+ "a good photo of the {}",
468
+ "a photo of one {}",
469
+ "a close-up photo of the {}",
470
+ "a rendition of the {}",
471
+ "a photo of the clean {}",
472
+ "a rendition of a {}",
473
+ "a photo of a nice {}",
474
+ "a good photo of a {}",
475
+ "a photo of the nice {}",
476
+ "a photo of the small {}",
477
+ "a photo of the weird {}",
478
+ "a photo of the large {}",
479
+ "a photo of a cool {}",
480
+ "a photo of a small {}",
481
+ ]
482
+
483
+ imagenet_style_templates_small = [
484
+ "a painting in the style of {}",
485
+ "a rendering in the style of {}",
486
+ "a cropped painting in the style of {}",
487
+ "the painting in the style of {}",
488
+ "a clean painting in the style of {}",
489
+ "a dirty painting in the style of {}",
490
+ "a dark painting in the style of {}",
491
+ "a picture in the style of {}",
492
+ "a cool painting in the style of {}",
493
+ "a close-up painting in the style of {}",
494
+ "a bright painting in the style of {}",
495
+ "a cropped painting in the style of {}",
496
+ "a good painting in the style of {}",
497
+ "a close-up painting in the style of {}",
498
+ "a rendition in the style of {}",
499
+ "a nice painting in the style of {}",
500
+ "a small painting in the style of {}",
501
+ "a weird painting in the style of {}",
502
+ "a large painting in the style of {}",
503
+ ]
504
+
505
+
506
+ class TextualInversionDataset(Dataset):
507
+ def __init__(
508
+ self,
509
+ data_root,
510
+ tokenizer,
511
+ learnable_property="object", # [object, style]
512
+ size=512,
513
+ repeats=100,
514
+ interpolation="bicubic",
515
+ flip_p=0.5,
516
+ set="train",
517
+ placeholder_token="*",
518
+ center_crop=False,
519
+ ):
520
+ self.data_root = data_root
521
+ self.tokenizer = tokenizer
522
+ self.learnable_property = learnable_property
523
+ self.size = size
524
+ self.placeholder_token = placeholder_token
525
+ self.center_crop = center_crop
526
+ self.flip_p = flip_p
527
+
528
+ self.image_paths = [os.path.join(self.data_root, file_path) for file_path in os.listdir(self.data_root)]
529
+
530
+ self.num_images = len(self.image_paths)
531
+ self._length = self.num_images
532
+
533
+ if set == "train":
534
+ self._length = self.num_images * repeats
535
+
536
+ self.interpolation = {
537
+ "linear": PIL_INTERPOLATION["linear"],
538
+ "bilinear": PIL_INTERPOLATION["bilinear"],
539
+ "bicubic": PIL_INTERPOLATION["bicubic"],
540
+ "lanczos": PIL_INTERPOLATION["lanczos"],
541
+ }[interpolation]
542
+
543
+ self.templates = imagenet_style_templates_small if learnable_property == "style" else imagenet_templates_small
544
+ self.flip_transform = transforms.RandomHorizontalFlip(p=self.flip_p)
545
+
546
+ def __len__(self):
547
+ return self._length
548
+
549
+ def __getitem__(self, i):
550
+ example = {}
551
+ image = Image.open(self.image_paths[i % self.num_images])
552
+
553
+ if not image.mode == "RGB":
554
+ image = image.convert("RGB")
555
+
556
+ placeholder_string = self.placeholder_token
557
+ text = random.choice(self.templates).format(placeholder_string)
558
+
559
+ example["input_ids"] = self.tokenizer(
560
+ text,
561
+ padding="max_length",
562
+ truncation=True,
563
+ max_length=self.tokenizer.model_max_length,
564
+ return_tensors="pt",
565
+ ).input_ids[0]
566
+
567
+ # default to score-sde preprocessing
568
+ img = np.array(image).astype(np.uint8)
569
+
570
+ if self.center_crop:
571
+ crop = min(img.shape[0], img.shape[1])
572
+ (
573
+ h,
574
+ w,
575
+ ) = (
576
+ img.shape[0],
577
+ img.shape[1],
578
+ )
579
+ img = img[(h - crop) // 2 : (h + crop) // 2, (w - crop) // 2 : (w + crop) // 2]
580
+
581
+ image = Image.fromarray(img)
582
+ image = image.resize((self.size, self.size), resample=self.interpolation)
583
+
584
+ image = self.flip_transform(image)
585
+ image = np.array(image).astype(np.uint8)
586
+ image = (image / 127.5 - 1.0).astype(np.float32)
587
+
588
+ example["pixel_values"] = torch.from_numpy(image).permute(2, 0, 1)
589
+ return example
590
+
591
+
592
+ def main():
593
+ args = parse_args()
594
+ if args.report_to == "wandb" and args.hub_token is not None:
595
+ raise ValueError(
596
+ "You cannot use both --report_to=wandb and --hub_token due to a security risk of exposing your token."
597
+ " Please use `huggingface-cli login` to authenticate with the Hub."
598
+ )
599
+
600
+ logging_dir = os.path.join(args.output_dir, args.logging_dir)
601
+ accelerator_project_config = ProjectConfiguration(project_dir=args.output_dir, logging_dir=logging_dir)
602
+ accelerator = Accelerator(
603
+ gradient_accumulation_steps=args.gradient_accumulation_steps,
604
+ mixed_precision=args.mixed_precision,
605
+ log_with=args.report_to,
606
+ project_config=accelerator_project_config,
607
+ )
608
+
609
+ # Disable AMP for MPS.
610
+ if torch.backends.mps.is_available():
611
+ accelerator.native_amp = False
612
+
613
+ if args.report_to == "wandb":
614
+ if not is_wandb_available():
615
+ raise ImportError("Make sure to install wandb if you want to use it for logging during training.")
616
+
617
+ # Make one log on every process with the configuration for debugging.
618
+ logging.basicConfig(
619
+ format="%(asctime)s - %(levelname)s - %(name)s - %(message)s",
620
+ datefmt="%m/%d/%Y %H:%M:%S",
621
+ level=logging.INFO,
622
+ )
623
+ logger.info(accelerator.state, main_process_only=False)
624
+ if accelerator.is_local_main_process:
625
+ transformers.utils.logging.set_verbosity_warning()
626
+ diffusers.utils.logging.set_verbosity_info()
627
+ else:
628
+ transformers.utils.logging.set_verbosity_error()
629
+ diffusers.utils.logging.set_verbosity_error()
630
+
631
+ # If passed along, set the training seed now.
632
+ if args.seed is not None:
633
+ set_seed(args.seed)
634
+
635
+ # Handle the repository creation
636
+ if accelerator.is_main_process:
637
+ if args.output_dir is not None:
638
+ os.makedirs(args.output_dir, exist_ok=True)
639
+
640
+ if args.push_to_hub:
641
+ repo_id = create_repo(
642
+ repo_id=args.hub_model_id or Path(args.output_dir).name, exist_ok=True, token=args.hub_token
643
+ ).repo_id
644
+
645
+ # Load tokenizer
646
+ if args.tokenizer_name:
647
+ tokenizer = CLIPTokenizer.from_pretrained(args.tokenizer_name)
648
+ elif args.pretrained_model_name_or_path:
649
+ tokenizer = CLIPTokenizer.from_pretrained(args.pretrained_model_name_or_path, subfolder="tokenizer")
650
+
651
+ # Load scheduler and models
652
+ noise_scheduler = DDPMScheduler.from_pretrained(args.pretrained_model_name_or_path, subfolder="scheduler")
653
+ text_encoder = CLIPTextModel.from_pretrained(
654
+ args.pretrained_model_name_or_path, subfolder="text_encoder", revision=args.revision
655
+ )
656
+ vae = AutoencoderKL.from_pretrained(
657
+ args.pretrained_model_name_or_path, subfolder="vae", revision=args.revision, variant=args.variant
658
+ )
659
+ unet = UNet2DConditionModel.from_pretrained(
660
+ args.pretrained_model_name_or_path, subfolder="unet", revision=args.revision, variant=args.variant
661
+ )
662
+
663
+ # Add the placeholder token in tokenizer
664
+ placeholder_tokens = [args.placeholder_token]
665
+
666
+ if args.num_vectors < 1:
667
+ raise ValueError(f"--num_vectors has to be larger or equal to 1, but is {args.num_vectors}")
668
+
669
+ # add dummy tokens for multi-vector
670
+ additional_tokens = []
671
+ for i in range(1, args.num_vectors):
672
+ additional_tokens.append(f"{args.placeholder_token}_{i}")
673
+ placeholder_tokens += additional_tokens
674
+
675
+ num_added_tokens = tokenizer.add_tokens(placeholder_tokens)
676
+ if num_added_tokens != args.num_vectors:
677
+ raise ValueError(
678
+ f"The tokenizer already contains the token {args.placeholder_token}. Please pass a different"
679
+ " `placeholder_token` that is not already in the tokenizer."
680
+ )
681
+
682
+ # Convert the initializer_token, placeholder_token to ids
683
+ token_ids = tokenizer.encode(args.initializer_token, add_special_tokens=False)
684
+ # Check if initializer_token is a single token or a sequence of tokens
685
+ if len(token_ids) > 1:
686
+ raise ValueError("The initializer token must be a single token.")
687
+
688
+ initializer_token_id = token_ids[0]
689
+ placeholder_token_ids = tokenizer.convert_tokens_to_ids(placeholder_tokens)
690
+
691
+ # Resize the token embeddings as we are adding new special tokens to the tokenizer
692
+ text_encoder.resize_token_embeddings(len(tokenizer))
693
+
694
+ # Initialise the newly added placeholder token with the embeddings of the initializer token
695
+ token_embeds = text_encoder.get_input_embeddings().weight.data
696
+ with torch.no_grad():
697
+ for token_id in placeholder_token_ids:
698
+ token_embeds[token_id] = token_embeds[initializer_token_id].clone()
699
+
700
+ # Freeze vae and unet
701
+ vae.requires_grad_(False)
702
+ unet.requires_grad_(False)
703
+ # Freeze all parameters except for the token embeddings in text encoder
704
+ text_encoder.text_model.encoder.requires_grad_(False)
705
+ text_encoder.text_model.final_layer_norm.requires_grad_(False)
706
+ text_encoder.text_model.embeddings.position_embedding.requires_grad_(False)
707
+
708
+ if args.gradient_checkpointing:
709
+ # Keep unet in train mode if we are using gradient checkpointing to save memory.
710
+ # The dropout cannot be != 0 so it doesn't matter if we are in eval or train mode.
711
+ unet.train()
712
+ text_encoder.gradient_checkpointing_enable()
713
+ unet.enable_gradient_checkpointing()
714
+
715
+ if args.enable_xformers_memory_efficient_attention:
716
+ if is_xformers_available():
717
+ import xformers
718
+
719
+ xformers_version = version.parse(xformers.__version__)
720
+ if xformers_version == version.parse("0.0.16"):
721
+ logger.warning(
722
+ "xFormers 0.0.16 cannot be used for training in some GPUs. If you observe problems during training, please update xFormers to at least 0.0.17. See https://huggingface.co/docs/diffusers/main/en/optimization/xformers for more details."
723
+ )
724
+ unet.enable_xformers_memory_efficient_attention()
725
+ else:
726
+ raise ValueError("xformers is not available. Make sure it is installed correctly")
727
+
728
+ # Enable TF32 for faster training on Ampere GPUs,
729
+ # cf https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices
730
+ if args.allow_tf32:
731
+ torch.backends.cuda.matmul.allow_tf32 = True
732
+
733
+ if args.scale_lr:
734
+ args.learning_rate = (
735
+ args.learning_rate * args.gradient_accumulation_steps * args.train_batch_size * accelerator.num_processes
736
+ )
737
+
738
+ # Initialize the optimizer
739
+ optimizer = torch.optim.AdamW(
740
+ text_encoder.get_input_embeddings().parameters(), # only optimize the embeddings
741
+ lr=args.learning_rate,
742
+ betas=(args.adam_beta1, args.adam_beta2),
743
+ weight_decay=args.adam_weight_decay,
744
+ eps=args.adam_epsilon,
745
+ )
746
+
747
+ # Dataset and DataLoaders creation:
748
+ train_dataset = TextualInversionDataset(
749
+ data_root=args.train_data_dir,
750
+ tokenizer=tokenizer,
751
+ size=args.resolution,
752
+ placeholder_token=(" ".join(tokenizer.convert_ids_to_tokens(placeholder_token_ids))),
753
+ repeats=args.repeats,
754
+ learnable_property=args.learnable_property,
755
+ center_crop=args.center_crop,
756
+ set="train",
757
+ )
758
+ train_dataloader = torch.utils.data.DataLoader(
759
+ train_dataset, batch_size=args.train_batch_size, shuffle=True, num_workers=args.dataloader_num_workers
760
+ )
761
+ if args.validation_epochs is not None:
762
+ warnings.warn(
763
+ f"FutureWarning: You are doing logging with validation_epochs={args.validation_epochs}."
764
+ " Deprecated validation_epochs in favor of `validation_steps`"
765
+ f"Setting `args.validation_steps` to {args.validation_epochs * len(train_dataset)}",
766
+ FutureWarning,
767
+ stacklevel=2,
768
+ )
769
+ args.validation_steps = args.validation_epochs * len(train_dataset)
770
+
771
+ # Scheduler and math around the number of training steps.
772
+ overrode_max_train_steps = False
773
+ num_update_steps_per_epoch = math.ceil(len(train_dataloader) / args.gradient_accumulation_steps)
774
+ if args.max_train_steps is None:
775
+ args.max_train_steps = args.num_train_epochs * num_update_steps_per_epoch
776
+ overrode_max_train_steps = True
777
+
778
+ lr_scheduler = get_scheduler(
779
+ args.lr_scheduler,
780
+ optimizer=optimizer,
781
+ num_warmup_steps=args.lr_warmup_steps * accelerator.num_processes,
782
+ num_training_steps=args.max_train_steps * accelerator.num_processes,
783
+ num_cycles=args.lr_num_cycles,
784
+ )
785
+
786
+ text_encoder.train()
787
+ # Prepare everything with our `accelerator`.
788
+ text_encoder, optimizer, train_dataloader, lr_scheduler = accelerator.prepare(
789
+ text_encoder, optimizer, train_dataloader, lr_scheduler
790
+ )
791
+
792
+ # For mixed precision training we cast all non-trainable weights (vae and unet) to half-precision
793
+ # as these weights are only used for inference, keeping weights in full precision is not required.
794
+ weight_dtype = torch.float32
795
+ if accelerator.mixed_precision == "fp16":
796
+ weight_dtype = torch.float16
797
+ elif accelerator.mixed_precision == "bf16":
798
+ weight_dtype = torch.bfloat16
799
+
800
+ # Move vae and unet to device and cast to weight_dtype
801
+ unet.to(accelerator.device, dtype=weight_dtype)
802
+ vae.to(accelerator.device, dtype=weight_dtype)
803
+
804
+ # We need to recalculate our total training steps as the size of the training dataloader may have changed.
805
+ num_update_steps_per_epoch = math.ceil(len(train_dataloader) / args.gradient_accumulation_steps)
806
+ if overrode_max_train_steps:
807
+ args.max_train_steps = args.num_train_epochs * num_update_steps_per_epoch
808
+ # Afterwards we recalculate our number of training epochs
809
+ args.num_train_epochs = math.ceil(args.max_train_steps / num_update_steps_per_epoch)
810
+
811
+ # We need to initialize the trackers we use, and also store our configuration.
812
+ # The trackers initialize automatically on the main process.
813
+ if accelerator.is_main_process:
814
+ accelerator.init_trackers("textual_inversion", config=vars(args))
815
+
816
+ # Train!
817
+ total_batch_size = args.train_batch_size * accelerator.num_processes * args.gradient_accumulation_steps
818
+
819
+ logger.info("***** Running training *****")
820
+ logger.info(f" Num examples = {len(train_dataset)}")
821
+ logger.info(f" Num Epochs = {args.num_train_epochs}")
822
+ logger.info(f" Instantaneous batch size per device = {args.train_batch_size}")
823
+ logger.info(f" Total train batch size (w. parallel, distributed & accumulation) = {total_batch_size}")
824
+ logger.info(f" Gradient Accumulation steps = {args.gradient_accumulation_steps}")
825
+ logger.info(f" Total optimization steps = {args.max_train_steps}")
826
+ global_step = 0
827
+ first_epoch = 0
828
+ # Potentially load in the weights and states from a previous save
829
+ if args.resume_from_checkpoint:
830
+ if args.resume_from_checkpoint != "latest":
831
+ path = os.path.basename(args.resume_from_checkpoint)
832
+ else:
833
+ # Get the most recent checkpoint
834
+ dirs = os.listdir(args.output_dir)
835
+ dirs = [d for d in dirs if d.startswith("checkpoint")]
836
+ dirs = sorted(dirs, key=lambda x: int(x.split("-")[1]))
837
+ path = dirs[-1] if len(dirs) > 0 else None
838
+
839
+ if path is None:
840
+ accelerator.print(
841
+ f"Checkpoint '{args.resume_from_checkpoint}' does not exist. Starting a new training run."
842
+ )
843
+ args.resume_from_checkpoint = None
844
+ initial_global_step = 0
845
+ else:
846
+ accelerator.print(f"Resuming from checkpoint {path}")
847
+ accelerator.load_state(os.path.join(args.output_dir, path))
848
+ global_step = int(path.split("-")[1])
849
+
850
+ initial_global_step = global_step
851
+ first_epoch = global_step // num_update_steps_per_epoch
852
+
853
+ else:
854
+ initial_global_step = 0
855
+
856
+ progress_bar = tqdm(
857
+ range(0, args.max_train_steps),
858
+ initial=initial_global_step,
859
+ desc="Steps",
860
+ # Only show the progress bar once on each machine.
861
+ disable=not accelerator.is_local_main_process,
862
+ )
863
+
864
+ # keep original embeddings as reference
865
+ orig_embeds_params = accelerator.unwrap_model(text_encoder).get_input_embeddings().weight.data.clone()
866
+
867
+ for epoch in range(first_epoch, args.num_train_epochs):
868
+ text_encoder.train()
869
+ for step, batch in enumerate(train_dataloader):
870
+ with accelerator.accumulate(text_encoder):
871
+ # Convert images to latent space
872
+ latents = vae.encode(batch["pixel_values"].to(dtype=weight_dtype)).latent_dist.sample().detach()
873
+ latents = latents * vae.config.scaling_factor
874
+
875
+ # Sample noise that we'll add to the latents
876
+ noise = torch.randn_like(latents)
877
+ bsz = latents.shape[0]
878
+ # Sample a random timestep for each image
879
+ timesteps = torch.randint(0, noise_scheduler.config.num_train_timesteps, (bsz,), device=latents.device)
880
+ timesteps = timesteps.long()
881
+
882
+ # Add noise to the latents according to the noise magnitude at each timestep
883
+ # (this is the forward diffusion process)
884
+ noisy_latents = noise_scheduler.add_noise(latents, noise, timesteps)
885
+
886
+ # Get the text embedding for conditioning
887
+ encoder_hidden_states = text_encoder(batch["input_ids"])[0].to(dtype=weight_dtype)
888
+
889
+ # Predict the noise residual
890
+ model_pred = unet(noisy_latents, timesteps, encoder_hidden_states).sample
891
+
892
+ # Get the target for loss depending on the prediction type
893
+ if noise_scheduler.config.prediction_type == "epsilon":
894
+ target = noise
895
+ elif noise_scheduler.config.prediction_type == "v_prediction":
896
+ target = noise_scheduler.get_velocity(latents, noise, timesteps)
897
+ else:
898
+ raise ValueError(f"Unknown prediction type {noise_scheduler.config.prediction_type}")
899
+
900
+ loss = F.mse_loss(model_pred.float(), target.float(), reduction="mean")
901
+
902
+ accelerator.backward(loss)
903
+
904
+ optimizer.step()
905
+ lr_scheduler.step()
906
+ optimizer.zero_grad()
907
+
908
+ # Let's make sure we don't update any embedding weights besides the newly added token
909
+ index_no_updates = torch.ones((len(tokenizer),), dtype=torch.bool)
910
+ index_no_updates[min(placeholder_token_ids) : max(placeholder_token_ids) + 1] = False
911
+
912
+ with torch.no_grad():
913
+ accelerator.unwrap_model(text_encoder).get_input_embeddings().weight[
914
+ index_no_updates
915
+ ] = orig_embeds_params[index_no_updates]
916
+
917
+ # Checks if the accelerator has performed an optimization step behind the scenes
918
+ if accelerator.sync_gradients:
919
+ images = []
920
+ progress_bar.update(1)
921
+ global_step += 1
922
+ if global_step % args.save_steps == 0:
923
+ weight_name = (
924
+ f"learned_embeds-steps-{global_step}.bin"
925
+ if args.no_safe_serialization
926
+ else f"learned_embeds-steps-{global_step}.safetensors"
927
+ )
928
+ save_path = os.path.join(args.output_dir, weight_name)
929
+ save_progress(
930
+ text_encoder,
931
+ placeholder_token_ids,
932
+ accelerator,
933
+ args,
934
+ save_path,
935
+ safe_serialization=not args.no_safe_serialization,
936
+ )
937
+
938
+ if accelerator.is_main_process:
939
+ if global_step % args.checkpointing_steps == 0:
940
+ # _before_ saving state, check if this save would set us over the `checkpoints_total_limit`
941
+ if args.checkpoints_total_limit is not None:
942
+ checkpoints = os.listdir(args.output_dir)
943
+ checkpoints = [d for d in checkpoints if d.startswith("checkpoint")]
944
+ checkpoints = sorted(checkpoints, key=lambda x: int(x.split("-")[1]))
945
+
946
+ # before we save the new checkpoint, we need to have at _most_ `checkpoints_total_limit - 1` checkpoints
947
+ if len(checkpoints) >= args.checkpoints_total_limit:
948
+ num_to_remove = len(checkpoints) - args.checkpoints_total_limit + 1
949
+ removing_checkpoints = checkpoints[0:num_to_remove]
950
+
951
+ logger.info(
952
+ f"{len(checkpoints)} checkpoints already exist, removing {len(removing_checkpoints)} checkpoints"
953
+ )
954
+ logger.info(f"removing checkpoints: {', '.join(removing_checkpoints)}")
955
+
956
+ for removing_checkpoint in removing_checkpoints:
957
+ removing_checkpoint = os.path.join(args.output_dir, removing_checkpoint)
958
+ shutil.rmtree(removing_checkpoint)
959
+
960
+ save_path = os.path.join(args.output_dir, f"checkpoint-{global_step}")
961
+ accelerator.save_state(save_path)
962
+ logger.info(f"Saved state to {save_path}")
963
+
964
+ if args.validation_prompt is not None and global_step % args.validation_steps == 0:
965
+ images = log_validation(
966
+ text_encoder, tokenizer, unet, vae, args, accelerator, weight_dtype, epoch
967
+ )
968
+
969
+ logs = {"loss": loss.detach().item(), "lr": lr_scheduler.get_last_lr()[0]}
970
+ progress_bar.set_postfix(**logs)
971
+ accelerator.log(logs, step=global_step)
972
+
973
+ if global_step >= args.max_train_steps:
974
+ break
975
+ # Create the pipeline using the trained modules and save it.
976
+ accelerator.wait_for_everyone()
977
+ if accelerator.is_main_process:
978
+ if args.push_to_hub and not args.save_as_full_pipeline:
979
+ logger.warning("Enabling full model saving because --push_to_hub=True was specified.")
980
+ save_full_model = True
981
+ else:
982
+ save_full_model = args.save_as_full_pipeline
983
+ if save_full_model:
984
+ pipeline = StableDiffusionPipeline.from_pretrained(
985
+ args.pretrained_model_name_or_path,
986
+ text_encoder=accelerator.unwrap_model(text_encoder),
987
+ vae=vae,
988
+ unet=unet,
989
+ tokenizer=tokenizer,
990
+ )
991
+ pipeline.save_pretrained(args.output_dir)
992
+ # Save the newly trained embeddings
993
+ weight_name = "learned_embeds.bin" if args.no_safe_serialization else "learned_embeds.safetensors"
994
+ save_path = os.path.join(args.output_dir, weight_name)
995
+ save_progress(
996
+ text_encoder,
997
+ placeholder_token_ids,
998
+ accelerator,
999
+ args,
1000
+ save_path,
1001
+ safe_serialization=not args.no_safe_serialization,
1002
+ )
1003
+
1004
+ if args.push_to_hub:
1005
+ save_model_card(
1006
+ repo_id,
1007
+ images=images,
1008
+ base_model=args.pretrained_model_name_or_path,
1009
+ repo_folder=args.output_dir,
1010
+ )
1011
+ upload_folder(
1012
+ repo_id=repo_id,
1013
+ folder_path=args.output_dir,
1014
+ commit_message="End of training",
1015
+ ignore_patterns=["step_*", "epoch_*"],
1016
+ )
1017
+
1018
+ accelerator.end_training()
1019
+
1020
+
1021
+ if __name__ == "__main__":
1022
+ main()
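`textual_inversion.py` above saves only the learned token rows (by default as `learned_embeds.safetensors` in the output directory). A quick sanity check on that artifact, assuming the van Gogh output path from `inversion.sh`:

```python
from safetensors.torch import load_file

emb = load_file("./checkpoint/van_gogh_inversion/learned_embeds.safetensors")
for token, weight in emb.items():
    # For SD 1.x text encoders, each learned vector should be 768-dimensional.
    print(token, tuple(weight.shape))
```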
Gradient_ascent_traininig_scripts/train.sh ADDED
@@ -0,0 +1,16 @@
+ export MODEL_NAME="CompVis/stable-diffusion-v1-4"
+ export TRAIN_DIR="./generation/english_springer_erasure"
+
+ accelerate launch --mixed_precision="fp16" train_text_to_image.py \
+ --pretrained_model_name_or_path=$MODEL_NAME \
+ --train_data_dir=$TRAIN_DIR \
+ --use_ema \
+ --resolution=512 --center_crop --random_flip \
+ --train_batch_size=5 \
+ --gradient_accumulation_steps=4 \
+ --gradient_checkpointing \
+ --max_train_steps=10 \
+ --learning_rate=1e-05 \
+ --max_grad_norm=1 \
+ --lr_scheduler="constant" --lr_warmup_steps=0 \
+ --output_dir="./checkpoint/english_springer"
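`train.sh` drives the stock `train_text_to_image.py` below, which minimizes the usual denoising MSE on the generated concept images. For the gradient-ascent erasure runs this commit describes, the objective is presumably the same loss with its sign flipped, so the UNet is pushed *away* from reconstructing the concept. A self-contained toy illustration of that sign flip, with random tensors standing in for the UNet's noise prediction and the sampled noise:

```python
import torch
import torch.nn.functional as F

model_pred = torch.randn(2, 4, 64, 64, requires_grad=True)  # stand-in UNet output
target = torch.randn(2, 4, 64, 64)                          # stand-in sampled noise

descent_loss = F.mse_loss(model_pred, target)  # standard fine-tuning objective
ascent_loss = -descent_loss                    # gradient ascent: unlearn the concept
ascent_loss.backward()                         # gradients now *increase* the MSE
print(f"descent={descent_loss.item():.4f}, ascent={ascent_loss.item():.4f}")
```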
Gradient_ascent_traininig_scripts/train_text_to_image.py ADDED
@@ -0,0 +1,1156 @@
1
+ #!/usr/bin/env python
2
+ # coding=utf-8
3
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
4
+ #
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
15
+ # limitations under the License.
16
+
17
+ import argparse
18
+ import logging
19
+ import math
20
+ import os
21
+ import random
22
+ import shutil
23
+ from contextlib import nullcontext
24
+ from pathlib import Path
25
+
26
+ import accelerate
27
+ import datasets
28
+ import numpy as np
29
+ import torch
30
+ import torch.nn.functional as F
31
+ import torch.utils.checkpoint
32
+ import transformers
33
+ from accelerate import Accelerator
34
+ from accelerate.logging import get_logger
35
+ from accelerate.state import AcceleratorState
36
+ from accelerate.utils import ProjectConfiguration, set_seed
37
+ from datasets import load_dataset
38
+ from huggingface_hub import create_repo, upload_folder
39
+ from packaging import version
40
+ from torchvision import transforms
41
+ from tqdm.auto import tqdm
42
+ from transformers import CLIPTextModel, CLIPTokenizer
43
+ from transformers.utils import ContextManagers
44
+
45
+ import diffusers
46
+ from diffusers import AutoencoderKL, DDPMScheduler, StableDiffusionPipeline, UNet2DConditionModel
47
+ from diffusers.optimization import get_scheduler
48
+ from diffusers.training_utils import EMAModel, compute_dream_and_update_latents, compute_snr
49
+ from diffusers.utils import check_min_version, deprecate, is_wandb_available, make_image_grid
50
+ from diffusers.utils.hub_utils import load_or_create_model_card, populate_model_card
51
+ from diffusers.utils.import_utils import is_xformers_available
52
+ from diffusers.utils.torch_utils import is_compiled_module
54
+
55
+ if is_wandb_available():
56
+ import wandb
57
+
58
+
59
+ # Will error if the minimal version of diffusers is not installed. Remove at your own risks.
60
+ check_min_version("0.31.0.dev0")
61
+
62
+ logger = get_logger(__name__, log_level="INFO")
63
+
64
+ DATASET_NAME_MAPPING = {
65
+ "lambdalabs/naruto-blip-captions": ("image", "text"),
66
+ }
67
+
68
+
69
+ def save_model_card(
70
+ args,
71
+ repo_id: str,
72
+ images: list = None,
73
+ repo_folder: str = None,
74
+ ):
75
+ img_str = ""
76
+ if len(images) > 0:
77
+ image_grid = make_image_grid(images, 1, len(args.validation_prompts))
78
+ image_grid.save(os.path.join(repo_folder, "val_imgs_grid.png"))
79
+ img_str += "![val_imgs_grid](./val_imgs_grid.png)\n"
80
+
81
+ model_description = f"""
82
+ # Text-to-image finetuning - {repo_id}
83
+
84
+ This pipeline was finetuned from **{args.pretrained_model_name_or_path}** on the **{args.dataset_name}** dataset. Below are some example images generated with the finetuned pipeline using the following prompts: {args.validation_prompts}. \n
85
+ {img_str}
86
+
87
+ ## Pipeline usage
88
+
89
+ You can use the pipeline like so:
90
+
91
+ ```python
92
+ from diffusers import DiffusionPipeline
93
+ import torch
94
+
95
+ pipeline = DiffusionPipeline.from_pretrained("{repo_id}", torch_dtype=torch.float16)
96
+ prompt = "{args.validation_prompts[0]}"
97
+ image = pipeline(prompt).images[0]
98
+ image.save("my_image.png")
99
+ ```
100
+
101
+ ## Training info
102
+
103
+ These are the key hyperparameters used during training:
104
+
105
+ * Epochs: {args.num_train_epochs}
106
+ * Learning rate: {args.learning_rate}
107
+ * Batch size: {args.train_batch_size}
108
+ * Gradient accumulation steps: {args.gradient_accumulation_steps}
109
+ * Image resolution: {args.resolution}
110
+ * Mixed-precision: {args.mixed_precision}
111
+
112
+ """
113
+ wandb_info = ""
114
+ if is_wandb_available():
115
+ wandb_run_url = None
116
+ if wandb.run is not None:
117
+ wandb_run_url = wandb.run.url
118
+
119
+ if wandb_run_url is not None:
120
+ wandb_info = f"""
121
+ More information on all the CLI arguments and the environment are available on your [`wandb` run page]({wandb_run_url}).
122
+ """
123
+
124
+ model_description += wandb_info
125
+
126
+ model_card = load_or_create_model_card(
127
+ repo_id_or_path=repo_id,
128
+ from_training=True,
129
+ license="creativeml-openrail-m",
130
+ base_model=args.pretrained_model_name_or_path,
131
+ model_description=model_description,
132
+ inference=True,
133
+ )
134
+
135
+ tags = ["stable-diffusion", "stable-diffusion-diffusers", "text-to-image", "diffusers", "diffusers-training"]
136
+ model_card = populate_model_card(model_card, tags=tags)
137
+
138
+ model_card.save(os.path.join(repo_folder, "README.md"))
139
+
140
+
141
+ def log_validation(vae, text_encoder, tokenizer, unet, args, accelerator, weight_dtype, epoch):
142
+ logger.info("Running validation... ")
143
+
144
+ pipeline = StableDiffusionPipeline.from_pretrained(
145
+ args.pretrained_model_name_or_path,
146
+ vae=accelerator.unwrap_model(vae),
147
+ text_encoder=accelerator.unwrap_model(text_encoder),
148
+ tokenizer=tokenizer,
149
+ unet=accelerator.unwrap_model(unet),
150
+ safety_checker=None,
151
+ revision=args.revision,
152
+ variant=args.variant,
153
+ torch_dtype=weight_dtype,
154
+ )
155
+ pipeline = pipeline.to(accelerator.device)
156
+ pipeline.set_progress_bar_config(disable=True)
157
+
158
+ if args.enable_xformers_memory_efficient_attention:
159
+ pipeline.enable_xformers_memory_efficient_attention()
160
+
161
+ if args.seed is None:
162
+ generator = None
163
+ else:
164
+ generator = torch.Generator(device=accelerator.device).manual_seed(args.seed)
165
+
166
+ images = []
167
+ for i in range(len(args.validation_prompts)):
168
+ if torch.backends.mps.is_available():
169
+ autocast_ctx = nullcontext()
170
+ else:
171
+ autocast_ctx = torch.autocast(accelerator.device.type)
172
+
173
+ with autocast_ctx:
174
+ image = pipeline(args.validation_prompts[i], num_inference_steps=20, generator=generator).images[0]
175
+
176
+ images.append(image)
177
+
178
+ for tracker in accelerator.trackers:
179
+ if tracker.name == "tensorboard":
180
+ np_images = np.stack([np.asarray(img) for img in images])
181
+ tracker.writer.add_images("validation", np_images, epoch, dataformats="NHWC")
182
+ elif tracker.name == "wandb":
183
+ tracker.log(
184
+ {
185
+ "validation": [
186
+ wandb.Image(image, caption=f"{i}: {args.validation_prompts[i]}")
187
+ for i, image in enumerate(images)
188
+ ]
189
+ }
190
+ )
191
+ else:
192
+ logger.warning(f"image logging not implemented for {tracker.name}")
193
+
194
+ del pipeline
195
+ torch.cuda.empty_cache()
196
+
197
+ return images
198
+
199
+
200
+def parse_args():
+    parser = argparse.ArgumentParser(description="Simple example of a training script.")
+    parser.add_argument(
+        "--input_perturbation", type=float, default=0, help="The scale of input perturbation. Recommended 0.1."
+    )
+    parser.add_argument(
+        "--pretrained_model_name_or_path",
+        type=str,
+        default=None,
+        required=True,
+        help="Path to pretrained model or model identifier from huggingface.co/models.",
+    )
+    parser.add_argument(
+        "--revision",
+        type=str,
+        default=None,
+        required=False,
+        help="Revision of pretrained model identifier from huggingface.co/models.",
+    )
+    parser.add_argument(
+        "--variant",
+        type=str,
+        default=None,
+        help="Variant of the model files of the pretrained model identifier from huggingface.co/models, e.g. fp16",
+    )
+    parser.add_argument(
+        "--dataset_name",
+        type=str,
+        default=None,
+        help=(
+            "The name of the Dataset (from the HuggingFace hub) to train on (could be your own, possibly private,"
+            " dataset). It can also be a path pointing to a local copy of a dataset in your filesystem,"
+            " or to a folder containing files that 🤗 Datasets can understand."
+        ),
+    )
+    parser.add_argument(
+        "--dataset_config_name",
+        type=str,
+        default=None,
+        help="The config of the Dataset, leave as None if there's only one config.",
+    )
+    parser.add_argument(
+        "--train_data_dir",
+        type=str,
+        default=None,
+        help=(
+            "A folder containing the training data. Folder contents must follow the structure described in"
+            " https://huggingface.co/docs/datasets/image_dataset#imagefolder. In particular, a `metadata.jsonl` file"
+            " must exist to provide the captions for the images. Ignored if `dataset_name` is specified."
+        ),
+    )
+    parser.add_argument(
+        "--image_column", type=str, default="image", help="The column of the dataset containing an image."
+    )
+    parser.add_argument(
+        "--caption_column",
+        type=str,
+        default="text",
+        help="The column of the dataset containing a caption or a list of captions.",
+    )
+    parser.add_argument(
+        "--max_train_samples",
+        type=int,
+        default=None,
+        help=(
+            "For debugging purposes or quicker training, truncate the number of training examples to this "
+            "value if set."
+        ),
+    )
+    parser.add_argument(
+        "--validation_prompts",
+        type=str,
+        default=None,
+        nargs="+",
+        help=("A set of prompts evaluated every `--validation_epochs` and logged to `--report_to`."),
+    )
+    parser.add_argument(
+        "--output_dir",
+        type=str,
+        default="sd-model-finetuned",
+        help="The output directory where the model predictions and checkpoints will be written.",
+    )
+    parser.add_argument(
+        "--cache_dir",
+        type=str,
+        default=None,
+        help="The directory where the downloaded models and datasets will be stored.",
+    )
+    parser.add_argument("--seed", type=int, default=None, help="A seed for reproducible training.")
+    parser.add_argument(
+        "--resolution",
+        type=int,
+        default=512,
+        help=(
+            "The resolution for input images; all the images in the train/validation dataset will be resized to this"
+            " resolution."
+        ),
+    )
+    parser.add_argument(
+        "--center_crop",
+        default=False,
+        action="store_true",
+        help=(
+            "Whether to center crop the input images to the resolution. If not set, the images will be randomly"
+            " cropped. The images will be resized to the resolution first before cropping."
+        ),
+    )
+    parser.add_argument(
+        "--random_flip",
+        action="store_true",
+        help="Whether to randomly flip images horizontally.",
+    )
+    parser.add_argument(
+        "--train_batch_size", type=int, default=16, help="Batch size (per device) for the training dataloader."
+    )
+    parser.add_argument("--num_train_epochs", type=int, default=100)
+    parser.add_argument(
+        "--max_train_steps",
+        type=int,
+        default=None,
+        help="Total number of training steps to perform. If provided, overrides num_train_epochs.",
+    )
+    parser.add_argument(
+        "--gradient_accumulation_steps",
+        type=int,
+        default=1,
+        help="Number of update steps to accumulate before performing a backward/update pass.",
+    )
+    parser.add_argument(
+        "--gradient_checkpointing",
+        action="store_true",
+        help="Whether or not to use gradient checkpointing to save memory at the expense of a slower backward pass.",
+    )
+    parser.add_argument(
+        "--learning_rate",
+        type=float,
+        default=1e-4,
+        help="Initial learning rate (after the potential warmup period) to use.",
+    )
+    parser.add_argument(
+        "--scale_lr",
+        action="store_true",
+        default=False,
+        help="Scale the learning rate by the number of GPUs, gradient accumulation steps, and batch size.",
+    )
+    parser.add_argument(
+        "--lr_scheduler",
+        type=str,
+        default="constant",
+        help=(
+            'The scheduler type to use. Choose between ["linear", "cosine", "cosine_with_restarts", "polynomial",'
+            ' "constant", "constant_with_warmup"]'
+        ),
+    )
+    parser.add_argument(
+        "--lr_warmup_steps", type=int, default=500, help="Number of steps for the warmup in the lr scheduler."
+    )
+    parser.add_argument(
+        "--snr_gamma",
+        type=float,
+        default=None,
+        help="SNR weighting gamma to be used if rebalancing the loss. Recommended value is 5.0. "
+        "More details here: https://arxiv.org/abs/2303.09556.",
+    )
+    parser.add_argument(
+        "--dream_training",
+        action="store_true",
+        help=(
+            "Use the DREAM training method, which makes training more efficient and accurate at the "
+            "expense of doing an extra forward pass. See: https://arxiv.org/abs/2312.00210"
+        ),
+    )
+    parser.add_argument(
+        "--dream_detail_preservation",
+        type=float,
+        default=1.0,
+        help="Dream detail preservation factor p (should be greater than 0; default=1.0, as suggested in the paper)",
+    )
+    parser.add_argument(
+        "--use_8bit_adam", action="store_true", help="Whether or not to use 8-bit Adam from bitsandbytes."
+    )
+    parser.add_argument(
+        "--allow_tf32",
+        action="store_true",
+        help=(
+            "Whether or not to allow TF32 on Ampere GPUs. Can be used to speed up training. For more information, see"
+            " https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices"
+        ),
+    )
+    parser.add_argument("--use_ema", action="store_true", help="Whether to use EMA model.")
+    parser.add_argument("--offload_ema", action="store_true", help="Offload EMA model to CPU during training step.")
+    parser.add_argument("--foreach_ema", action="store_true", help="Use faster foreach implementation of EMAModel.")
+    parser.add_argument(
+        "--non_ema_revision",
+        type=str,
+        default=None,
+        required=False,
+        help=(
+            "Revision of pretrained non-ema model identifier. Must be a branch, tag or git identifier of the local or"
+            " remote repository specified with --pretrained_model_name_or_path."
+        ),
+    )
+    parser.add_argument(
+        "--dataloader_num_workers",
+        type=int,
+        default=0,
+        help=(
+            "Number of subprocesses to use for data loading. 0 means that the data will be loaded in the main process."
+        ),
+    )
+    parser.add_argument("--adam_beta1", type=float, default=0.9, help="The beta1 parameter for the Adam optimizer.")
+    parser.add_argument("--adam_beta2", type=float, default=0.999, help="The beta2 parameter for the Adam optimizer.")
+    parser.add_argument("--adam_weight_decay", type=float, default=1e-2, help="Weight decay to use.")
+    parser.add_argument("--adam_epsilon", type=float, default=1e-08, help="Epsilon value for the Adam optimizer")
+    parser.add_argument("--max_grad_norm", default=1.0, type=float, help="Max gradient norm.")
+    parser.add_argument("--push_to_hub", action="store_true", help="Whether or not to push the model to the Hub.")
+    parser.add_argument("--hub_token", type=str, default=None, help="The token to use to push to the Model Hub.")
+    parser.add_argument(
+        "--prediction_type",
+        type=str,
+        default=None,
+        help="The prediction_type that shall be used for training. Choose between 'epsilon' or 'v_prediction' or leave `None`. If left to `None` the default prediction type of the scheduler: `noise_scheduler.config.prediction_type` is chosen.",
+    )
+    parser.add_argument(
+        "--hub_model_id",
+        type=str,
+        default=None,
+        help="The name of the repository to keep in sync with the local `output_dir`.",
+    )
+    parser.add_argument(
+        "--logging_dir",
+        type=str,
+        default="logs",
+        help=(
+            "[TensorBoard](https://www.tensorflow.org/tensorboard) log directory. Will default to"
+            " *output_dir/runs/**CURRENT_DATETIME_HOSTNAME***."
+        ),
+    )
+    parser.add_argument(
+        "--mixed_precision",
+        type=str,
+        default=None,
+        choices=["no", "fp16", "bf16"],
+        help=(
+            "Whether to use mixed precision. Choose between fp16 and bf16 (bfloat16). Bf16 requires PyTorch >="
+            " 1.10 and an Nvidia Ampere GPU. Defaults to the value of the accelerate config of the current system or the"
+            " flag passed with the `accelerate.launch` command. Use this argument to override the accelerate config."
+        ),
+    )
+    parser.add_argument(
+        "--report_to",
+        type=str,
+        default="tensorboard",
+        help=(
+            'The integration to report the results and logs to. Supported platforms are `"tensorboard"`'
+            ' (default), `"wandb"` and `"comet_ml"`. Use `"all"` to report to all integrations.'
+        ),
+    )
+    parser.add_argument("--local_rank", type=int, default=-1, help="For distributed training: local_rank")
+    parser.add_argument(
+        "--checkpointing_steps",
+        type=int,
+        default=500,
+        help=(
+            "Save a checkpoint of the training state every X updates. These checkpoints are only suitable for resuming"
+            " training using `--resume_from_checkpoint`."
+        ),
+    )
+    parser.add_argument(
+        "--checkpoints_total_limit",
+        type=int,
+        default=None,
+        help=("Max number of checkpoints to store."),
+    )
+    parser.add_argument(
+        "--resume_from_checkpoint",
+        type=str,
+        default=None,
+        help=(
+            "Whether training should be resumed from a previous checkpoint. Use a path saved by"
+            ' `--checkpointing_steps`, or `"latest"` to automatically select the last available checkpoint.'
+        ),
+    )
+    parser.add_argument(
+        "--enable_xformers_memory_efficient_attention", action="store_true", help="Whether or not to use xformers."
+    )
+    parser.add_argument("--noise_offset", type=float, default=0, help="The scale of noise offset.")
+    parser.add_argument(
+        "--validation_epochs",
+        type=int,
+        default=5,
+        help="Run validation every X epochs.",
+    )
+    parser.add_argument(
+        "--tracker_project_name",
+        type=str,
+        default="text2image-fine-tune",
+        help=(
+            "The `project_name` argument passed to Accelerator.init_trackers. For more information, see"
+            " https://huggingface.co/docs/accelerate/v0.17.0/en/package_reference/accelerator#accelerate.Accelerator"
+        ),
+    )
+
+    args = parser.parse_args()
+    env_local_rank = int(os.environ.get("LOCAL_RANK", -1))
+    if env_local_rank != -1 and env_local_rank != args.local_rank:
+        args.local_rank = env_local_rank
+
+    # Sanity checks
+    if args.dataset_name is None and args.train_data_dir is None:
+        raise ValueError("Need either a dataset name or a training folder.")
+
+    # Default to using the same revision for the non-EMA model if not specified.
+    if args.non_ema_revision is None:
+        args.non_ema_revision = args.revision
+
+    return args
+
+
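For reference, a minimal sketch of the CLI contract `parse_args` defines. Every value below is a hypothetical placeholder (the repo's `train.sh` wraps the actual `accelerate launch` invocation), and the base checkpoint is assumed to be a Stable Diffusion v1.x model:

```python
# Sketch only: drive parse_args() programmatically with hypothetical values.
import sys

sys.argv = [
    "train_text_to_image.py",
    "--pretrained_model_name_or_path", "CompVis/stable-diffusion-v1-4",  # assumption: SD v1.x base
    "--train_data_dir", "data/car",    # imagefolder with train/*.jpg + metadata.jsonl
    "--output_dir", "checkpoint/car",  # where the unlearned pipeline is written
    "--resolution", "512",
    "--train_batch_size", "4",
    "--max_train_steps", "200",
    "--learning_rate", "1e-5",
]
args = parse_args()
print(args.train_data_dir, args.max_train_steps)  # sanity-check the parsed namespace
```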
+def main():
+    args = parse_args()
+
+    if args.report_to == "wandb" and args.hub_token is not None:
+        raise ValueError(
+            "You cannot use both --report_to=wandb and --hub_token due to a security risk of exposing your token."
+            " Please use `huggingface-cli login` to authenticate with the Hub."
+        )
+
+    if args.non_ema_revision is not None:
+        deprecate(
+            "non_ema_revision!=None",
+            "0.15.0",
+            message=(
+                "Downloading 'non_ema' weights from revision branches of the Hub is deprecated. Please make sure to"
+                " use `--variant=non_ema` instead."
+            ),
+        )
+    logging_dir = os.path.join(args.output_dir, args.logging_dir)
+
+    accelerator_project_config = ProjectConfiguration(project_dir=args.output_dir, logging_dir=logging_dir)
+
+    accelerator = Accelerator(
+        gradient_accumulation_steps=args.gradient_accumulation_steps,
+        mixed_precision=args.mixed_precision,
+        log_with=args.report_to,
+        project_config=accelerator_project_config,
+    )
+
+    # Disable AMP for MPS.
+    if torch.backends.mps.is_available():
+        accelerator.native_amp = False
+
+    # Make one log on every process with the configuration for debugging.
+    logging.basicConfig(
+        format="%(asctime)s - %(levelname)s - %(name)s - %(message)s",
+        datefmt="%m/%d/%Y %H:%M:%S",
+        level=logging.INFO,
+    )
+    logger.info(accelerator.state, main_process_only=False)
+    if accelerator.is_local_main_process:
+        datasets.utils.logging.set_verbosity_warning()
+        transformers.utils.logging.set_verbosity_warning()
+        diffusers.utils.logging.set_verbosity_info()
+    else:
+        datasets.utils.logging.set_verbosity_error()
+        transformers.utils.logging.set_verbosity_error()
+        diffusers.utils.logging.set_verbosity_error()
+
+    # If passed along, set the training seed now.
+    if args.seed is not None:
+        set_seed(args.seed)
+
+    # Handle the repository creation
+    if accelerator.is_main_process:
+        if args.output_dir is not None:
+            os.makedirs(args.output_dir, exist_ok=True)
+
+        if args.push_to_hub:
+            repo_id = create_repo(
+                repo_id=args.hub_model_id or Path(args.output_dir).name, exist_ok=True, token=args.hub_token
+            ).repo_id
+
+    # Load scheduler, tokenizer and models.
+    noise_scheduler = DDPMScheduler.from_pretrained(args.pretrained_model_name_or_path, subfolder="scheduler")
+    tokenizer = CLIPTokenizer.from_pretrained(
+        args.pretrained_model_name_or_path, subfolder="tokenizer", revision=args.revision
+    )
+
+    def deepspeed_zero_init_disabled_context_manager():
+        """
+        Return either a context list that includes one that will disable zero.Init, or an empty context list.
+        """
+        deepspeed_plugin = AcceleratorState().deepspeed_plugin if accelerate.state.is_initialized() else None
+        if deepspeed_plugin is None:
+            return []
+
+        return [deepspeed_plugin.zero3_init_context_manager(enable=False)]
+
+    # Currently Accelerate doesn't know how to handle multiple models under DeepSpeed ZeRO stage 3.
+    # For this to work properly all models must be run through `accelerate.prepare`. But accelerate
+    # will try to assign the same optimizer with the same weights to all models during
+    # `deepspeed.initialize`, which of course doesn't work.
+    #
+    # For now the following workaround will partially support DeepSpeed ZeRO-3, by excluding the two
+    # frozen models from being partitioned during `zero.Init`, which gets called during
+    # `from_pretrained`. So CLIPTextModel and AutoencoderKL will not enjoy the parameter sharding
+    # across multiple GPUs and only UNet2DConditionModel will get ZeRO sharded.
+    with ContextManagers(deepspeed_zero_init_disabled_context_manager()):
+        text_encoder = CLIPTextModel.from_pretrained(
+            args.pretrained_model_name_or_path, subfolder="text_encoder", revision=args.revision, variant=args.variant
+        )
+        vae = AutoencoderKL.from_pretrained(
+            args.pretrained_model_name_or_path, subfolder="vae", revision=args.revision, variant=args.variant
+        )
+
+    unet = UNet2DConditionModel.from_pretrained(
+        args.pretrained_model_name_or_path, subfolder="unet", revision=args.non_ema_revision
+    )
+
+    # Freeze vae and text_encoder and set unet to trainable
+    vae.requires_grad_(False)
+    text_encoder.requires_grad_(False)
+    unet.train()
+
+    # Create EMA for the unet.
+    if args.use_ema:
+        ema_unet = UNet2DConditionModel.from_pretrained(
+            args.pretrained_model_name_or_path, subfolder="unet", revision=args.revision, variant=args.variant
+        )
+        ema_unet = EMAModel(
+            ema_unet.parameters(),
+            model_cls=UNet2DConditionModel,
+            model_config=ema_unet.config,
+            foreach=args.foreach_ema,
+        )
+
+    if args.enable_xformers_memory_efficient_attention:
+        if is_xformers_available():
+            import xformers
+
+            xformers_version = version.parse(xformers.__version__)
+            if xformers_version == version.parse("0.0.16"):
+                logger.warning(
+                    "xFormers 0.0.16 cannot be used for training on some GPUs. If you observe problems during training, please update xFormers to at least 0.0.17. See https://huggingface.co/docs/diffusers/main/en/optimization/xformers for more details."
+                )
+            unet.enable_xformers_memory_efficient_attention()
+        else:
+            raise ValueError("xformers is not available. Make sure it is installed correctly.")
+
+    # `accelerate` 0.16.0 will have better support for customized saving
+    if version.parse(accelerate.__version__) >= version.parse("0.16.0"):
+        # create custom saving & loading hooks so that `accelerator.save_state(...)` serializes in a nice format
+        def save_model_hook(models, weights, output_dir):
+            if accelerator.is_main_process:
+                if args.use_ema:
+                    ema_unet.save_pretrained(os.path.join(output_dir, "unet_ema"))
+
+                for i, model in enumerate(models):
+                    model.save_pretrained(os.path.join(output_dir, "unet"))
+
+                    # make sure to pop weight so that corresponding model is not saved again
+                    weights.pop()
+
+        def load_model_hook(models, input_dir):
+            if args.use_ema:
+                load_model = EMAModel.from_pretrained(
+                    os.path.join(input_dir, "unet_ema"), UNet2DConditionModel, foreach=args.foreach_ema
+                )
+                ema_unet.load_state_dict(load_model.state_dict())
+                if args.offload_ema:
+                    ema_unet.pin_memory()
+                else:
+                    ema_unet.to(accelerator.device)
+                del load_model
+
+            for _ in range(len(models)):
+                # pop models so that they are not loaded again
+                model = models.pop()
+
+                # load diffusers style into model
+                load_model = UNet2DConditionModel.from_pretrained(input_dir, subfolder="unet")
+                model.register_to_config(**load_model.config)
+
+                model.load_state_dict(load_model.state_dict())
+                del load_model
+
+        accelerator.register_save_state_pre_hook(save_model_hook)
+        accelerator.register_load_state_pre_hook(load_model_hook)
+
+    if args.gradient_checkpointing:
+        unet.enable_gradient_checkpointing()
+
+    # Enable TF32 for faster training on Ampere GPUs,
+    # cf https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices
+    if args.allow_tf32:
+        torch.backends.cuda.matmul.allow_tf32 = True
+
+    if args.scale_lr:
+        args.learning_rate = (
+            args.learning_rate * args.gradient_accumulation_steps * args.train_batch_size * accelerator.num_processes
+        )
+
+    # Initialize the optimizer
+    if args.use_8bit_adam:
+        try:
+            import bitsandbytes as bnb
+        except ImportError:
+            raise ImportError(
+                "Please install bitsandbytes to use 8-bit Adam. You can do so by running `pip install bitsandbytes`"
+            )
+
+        optimizer_cls = bnb.optim.AdamW8bit
+    else:
+        optimizer_cls = torch.optim.AdamW
+
+    optimizer = optimizer_cls(
+        unet.parameters(),
+        lr=args.learning_rate,
+        betas=(args.adam_beta1, args.adam_beta2),
+        weight_decay=args.adam_weight_decay,
+        eps=args.adam_epsilon,
+    )
+
+    # Get the datasets: you can either provide your own training and evaluation files (see below)
+    # or specify a Dataset from the hub (the dataset will be downloaded automatically from the datasets Hub).
+
+    # In distributed training, the load_dataset function guarantees that only one local process can concurrently
+    # download the dataset.
+    if args.dataset_name is not None:
+        # Downloading and loading a dataset from the hub.
+        dataset = load_dataset(
+            args.dataset_name,
+            args.dataset_config_name,
+            cache_dir=args.cache_dir,
+            data_dir=args.train_data_dir,
+        )
+    else:
+        data_files = {}
+        if args.train_data_dir is not None:
+            data_files["train"] = os.path.join(args.train_data_dir, "**")
+        dataset = load_dataset(
+            "imagefolder",
+            data_files=data_files,
+            cache_dir=args.cache_dir,
+        )
+        # See more about loading custom images at
+        # https://huggingface.co/docs/datasets/v2.4.0/en/image_load#imagefolder
+
+    # Preprocessing the datasets.
+    # We need to tokenize inputs and targets.
+    column_names = dataset["train"].column_names
+
+    # Get the column names for input/target.
+    dataset_columns = DATASET_NAME_MAPPING.get(args.dataset_name, None)
+    if args.image_column is None:
+        image_column = dataset_columns[0] if dataset_columns is not None else column_names[0]
+    else:
+        image_column = args.image_column
+        if image_column not in column_names:
+            raise ValueError(
+                f"`--image_column` value '{args.image_column}' needs to be one of: {', '.join(column_names)}"
+            )
+    if args.caption_column is None:
+        caption_column = dataset_columns[1] if dataset_columns is not None else column_names[1]
+    else:
+        caption_column = args.caption_column
+        if caption_column not in column_names:
+            raise ValueError(
+                f"`--caption_column` value '{args.caption_column}' needs to be one of: {', '.join(column_names)}"
+            )
+
+    # Preprocessing the datasets.
+    # We need to tokenize input captions and transform the images.
+    def tokenize_captions(examples, is_train=True):
+        captions = []
+        for caption in examples[caption_column]:
+            if isinstance(caption, str):
+                captions.append(caption)
+            elif isinstance(caption, (list, np.ndarray)):
+                # take a random caption if there are multiple
+                captions.append(random.choice(caption) if is_train else caption[0])
+            else:
+                raise ValueError(
+                    f"Caption column `{caption_column}` should contain either strings or lists of strings."
+                )
+        inputs = tokenizer(
+            captions, max_length=tokenizer.model_max_length, padding="max_length", truncation=True, return_tensors="pt"
+        )
+        return inputs.input_ids
+
+    # Preprocessing the datasets.
+    train_transforms = transforms.Compose(
+        [
+            transforms.Resize(args.resolution, interpolation=transforms.InterpolationMode.BILINEAR),
+            transforms.CenterCrop(args.resolution) if args.center_crop else transforms.RandomCrop(args.resolution),
+            transforms.RandomHorizontalFlip() if args.random_flip else transforms.Lambda(lambda x: x),
+            transforms.ToTensor(),
+            transforms.Normalize([0.5], [0.5]),
+        ]
+    )
+
+    def preprocess_train(examples):
+        images = [image.convert("RGB") for image in examples[image_column]]
+        examples["pixel_values"] = [train_transforms(image) for image in images]
+        examples["input_ids"] = tokenize_captions(examples)
+        return examples
+
+    with accelerator.main_process_first():
+        if args.max_train_samples is not None:
+            dataset["train"] = dataset["train"].shuffle(seed=args.seed).select(range(args.max_train_samples))
+        # Set the training transforms
+        train_dataset = dataset["train"].with_transform(preprocess_train)
+
+    def collate_fn(examples):
+        pixel_values = torch.stack([example["pixel_values"] for example in examples])
+        pixel_values = pixel_values.to(memory_format=torch.contiguous_format).float()
+        input_ids = torch.stack([example["input_ids"] for example in examples])
+        return {"pixel_values": pixel_values, "input_ids": input_ids}
+
+    # DataLoaders creation:
+    train_dataloader = torch.utils.data.DataLoader(
+        train_dataset,
+        shuffle=True,
+        collate_fn=collate_fn,
+        batch_size=args.train_batch_size,
+        num_workers=args.dataloader_num_workers,
+    )
+
+    # Scheduler and math around the number of training steps.
+    # Check the PR https://github.com/huggingface/diffusers/pull/8312 for detailed explanation.
+    num_warmup_steps_for_scheduler = args.lr_warmup_steps * accelerator.num_processes
+    if args.max_train_steps is None:
+        len_train_dataloader_after_sharding = math.ceil(len(train_dataloader) / accelerator.num_processes)
+        num_update_steps_per_epoch = math.ceil(len_train_dataloader_after_sharding / args.gradient_accumulation_steps)
+        num_training_steps_for_scheduler = (
+            args.num_train_epochs * num_update_steps_per_epoch * accelerator.num_processes
+        )
+    else:
+        num_training_steps_for_scheduler = args.max_train_steps * accelerator.num_processes
+
+    lr_scheduler = get_scheduler(
+        args.lr_scheduler,
+        optimizer=optimizer,
+        num_warmup_steps=num_warmup_steps_for_scheduler,
+        num_training_steps=num_training_steps_for_scheduler,
+    )
+
+    # Prepare everything with our `accelerator`.
+    unet, optimizer, train_dataloader, lr_scheduler = accelerator.prepare(
+        unet, optimizer, train_dataloader, lr_scheduler
+    )
+
+    if args.use_ema:
+        if args.offload_ema:
+            ema_unet.pin_memory()
+        else:
+            ema_unet.to(accelerator.device)
+
+    # For mixed precision training we cast all non-trainable weights (vae and text_encoder) to half-precision,
+    # as these weights are only used for inference; keeping them in full precision is not required.
+    weight_dtype = torch.float32
+    if accelerator.mixed_precision == "fp16":
+        weight_dtype = torch.float16
+        args.mixed_precision = accelerator.mixed_precision
+    elif accelerator.mixed_precision == "bf16":
+        weight_dtype = torch.bfloat16
+        args.mixed_precision = accelerator.mixed_precision
+
+    # Move text_encoder and vae to GPU and cast to weight_dtype
+    text_encoder.to(accelerator.device, dtype=weight_dtype)
+    vae.to(accelerator.device, dtype=weight_dtype)
+
+    # We need to recalculate our total training steps as the size of the training dataloader may have changed.
+    num_update_steps_per_epoch = math.ceil(len(train_dataloader) / args.gradient_accumulation_steps)
+    if args.max_train_steps is None:
+        args.max_train_steps = args.num_train_epochs * num_update_steps_per_epoch
+        if num_training_steps_for_scheduler != args.max_train_steps * accelerator.num_processes:
+            logger.warning(
+                f"The length of the 'train_dataloader' after 'accelerator.prepare' ({len(train_dataloader)}) does not match "
+                f"the expected length ({len_train_dataloader_after_sharding}) when the learning rate scheduler was created. "
+                f"This inconsistency may result in the learning rate scheduler not functioning properly."
+            )
+    # Afterwards we recalculate our number of training epochs
+    args.num_train_epochs = math.ceil(args.max_train_steps / num_update_steps_per_epoch)
+
+    # We need to initialize the trackers we use, and also store our configuration.
+    # The trackers are initialized automatically on the main process.
+    if accelerator.is_main_process:
+        tracker_config = dict(vars(args))
+        tracker_config.pop("validation_prompts")
+        accelerator.init_trackers(args.tracker_project_name, tracker_config)
+
+    # Function for unwrapping if model was compiled with `torch.compile`.
+    def unwrap_model(model):
+        model = accelerator.unwrap_model(model)
+        model = model._orig_mod if is_compiled_module(model) else model
+        return model
+
+    # Train!
+    total_batch_size = args.train_batch_size * accelerator.num_processes * args.gradient_accumulation_steps
+
+    logger.info("***** Running training *****")
+    logger.info(f"  Num examples = {len(train_dataset)}")
+    logger.info(f"  Num Epochs = {args.num_train_epochs}")
+    logger.info(f"  Instantaneous batch size per device = {args.train_batch_size}")
+    logger.info(f"  Total train batch size (w. parallel, distributed & accumulation) = {total_batch_size}")
+    logger.info(f"  Gradient Accumulation steps = {args.gradient_accumulation_steps}")
+    logger.info(f"  Total optimization steps = {args.max_train_steps}")
+    global_step = 0
+    first_epoch = 0
+
+    # Potentially load in the weights and states from a previous save
+    if args.resume_from_checkpoint:
+        if args.resume_from_checkpoint != "latest":
+            path = os.path.basename(args.resume_from_checkpoint)
+        else:
+            # Get the most recent checkpoint
+            dirs = os.listdir(args.output_dir)
+            dirs = [d for d in dirs if d.startswith("checkpoint")]
+            dirs = sorted(dirs, key=lambda x: int(x.split("-")[1]))
+            path = dirs[-1] if len(dirs) > 0 else None
+
+        if path is None:
+            accelerator.print(
+                f"Checkpoint '{args.resume_from_checkpoint}' does not exist. Starting a new training run."
+            )
+            args.resume_from_checkpoint = None
+            initial_global_step = 0
+        else:
+            accelerator.print(f"Resuming from checkpoint {path}")
+            accelerator.load_state(os.path.join(args.output_dir, path))
+            global_step = int(path.split("-")[1])
+
+            initial_global_step = global_step
+            first_epoch = global_step // num_update_steps_per_epoch
+
+    else:
+        initial_global_step = 0
+
+    progress_bar = tqdm(
+        range(0, args.max_train_steps),
+        initial=initial_global_step,
+        desc="Steps",
+        # Only show the progress bar once on each machine.
+        disable=not accelerator.is_local_main_process,
+    )
+
+    for epoch in range(first_epoch, args.num_train_epochs):
+        train_loss = 0.0
+        for step, batch in enumerate(train_dataloader):
+            with accelerator.accumulate(unet):
+                # Convert images to latent space
+                latents = vae.encode(batch["pixel_values"].to(weight_dtype)).latent_dist.sample()
+                latents = latents * vae.config.scaling_factor
+
+                # Sample noise that we'll add to the latents
+                noise = torch.randn_like(latents)
+                if args.noise_offset:
+                    # https://www.crosslabs.org//blog/diffusion-with-offset-noise
+                    noise += args.noise_offset * torch.randn(
+                        (latents.shape[0], latents.shape[1], 1, 1), device=latents.device
+                    )
+                if args.input_perturbation:
+                    new_noise = noise + args.input_perturbation * torch.randn_like(noise)
+                bsz = latents.shape[0]
+                # Sample a random timestep for each image
+                timesteps = torch.randint(0, noise_scheduler.config.num_train_timesteps, (bsz,), device=latents.device)
+                timesteps = timesteps.long()
+
+                # Add noise to the latents according to the noise magnitude at each timestep
+                # (this is the forward diffusion process)
+                if args.input_perturbation:
+                    noisy_latents = noise_scheduler.add_noise(latents, new_noise, timesteps)
+                else:
+                    noisy_latents = noise_scheduler.add_noise(latents, noise, timesteps)
+
+                # Get the text embedding for conditioning
+                encoder_hidden_states = text_encoder(batch["input_ids"], return_dict=False)[0]
+
+                # Get the target for loss depending on the prediction type
+                if args.prediction_type is not None:
+                    # set prediction_type of scheduler if defined
+                    noise_scheduler.register_to_config(prediction_type=args.prediction_type)
+
+                if noise_scheduler.config.prediction_type == "epsilon":
+                    target = noise
+                elif noise_scheduler.config.prediction_type == "v_prediction":
+                    target = noise_scheduler.get_velocity(latents, noise, timesteps)
+                else:
+                    raise ValueError(f"Unknown prediction type {noise_scheduler.config.prediction_type}")
+
+                if args.dream_training:
+                    noisy_latents, target = compute_dream_and_update_latents(
+                        unet,
+                        noise_scheduler,
+                        timesteps,
+                        noise,
+                        noisy_latents,
+                        target,
+                        encoder_hidden_states,
+                        args.dream_detail_preservation,
+                    )
+
+                # Predict the noise residual and compute loss
+                model_pred = unet(noisy_latents, timesteps, encoder_hidden_states, return_dict=False)[0]
+
+                if args.snr_gamma is None:
+                    loss = F.mse_loss(model_pred.float(), target.float(), reduction="mean")
+                else:
+                    # Compute loss-weights as per Section 3.4 of https://arxiv.org/abs/2303.09556.
+                    # Since we predict the noise instead of x_0, the original formulation is slightly changed.
+                    # This is discussed in Section 4.2 of the same paper.
+                    snr = compute_snr(noise_scheduler, timesteps)
+                    mse_loss_weights = torch.stack([snr, args.snr_gamma * torch.ones_like(timesteps)], dim=1).min(
+                        dim=1
+                    )[0]
+                    if noise_scheduler.config.prediction_type == "epsilon":
+                        mse_loss_weights = mse_loss_weights / snr
+                    elif noise_scheduler.config.prediction_type == "v_prediction":
+                        mse_loss_weights = mse_loss_weights / (snr + 1)
+
+                    loss = F.mse_loss(model_pred.float(), target.float(), reduction="none")
+                    loss = loss.mean(dim=list(range(1, len(loss.shape)))) * mse_loss_weights
+                    loss = loss.mean()
+
+                # Flip the sign of the loss for gradient ascent: the optimizer now *maximizes* the
+                # denoising error on the erasure concept instead of minimizing it.
+                loss = -loss
+
+                # Gather the losses across all processes for logging (if we use distributed training).
+                avg_loss = accelerator.gather(loss.repeat(args.train_batch_size)).mean()
+                train_loss += avg_loss.item() / args.gradient_accumulation_steps
+
+                # Backpropagate
+                accelerator.backward(loss)
+                if accelerator.sync_gradients:
+                    accelerator.clip_grad_norm_(unet.parameters(), args.max_grad_norm)
+                optimizer.step()
+                lr_scheduler.step()
+                optimizer.zero_grad()
+
+            # Checks if the accelerator has performed an optimization step behind the scenes
+            if accelerator.sync_gradients:
+                if args.use_ema:
+                    if args.offload_ema:
+                        ema_unet.to(device="cuda", non_blocking=True)
+                    ema_unet.step(unet.parameters())
+                    if args.offload_ema:
+                        ema_unet.to(device="cpu", non_blocking=True)
+                progress_bar.update(1)
+                global_step += 1
+                accelerator.log({"train_loss": train_loss}, step=global_step)
+                train_loss = 0.0
+
+                if global_step % args.checkpointing_steps == 0:
+                    if accelerator.is_main_process:
+                        # _before_ saving state, check if this save would set us over the `checkpoints_total_limit`
+                        if args.checkpoints_total_limit is not None:
+                            checkpoints = os.listdir(args.output_dir)
+                            checkpoints = [d for d in checkpoints if d.startswith("checkpoint")]
+                            checkpoints = sorted(checkpoints, key=lambda x: int(x.split("-")[1]))
+
+                            # before we save the new checkpoint, we need to have at _most_ `checkpoints_total_limit - 1` checkpoints
+                            if len(checkpoints) >= args.checkpoints_total_limit:
+                                num_to_remove = len(checkpoints) - args.checkpoints_total_limit + 1
+                                removing_checkpoints = checkpoints[0:num_to_remove]
+
+                                logger.info(
+                                    f"{len(checkpoints)} checkpoints already exist, removing {len(removing_checkpoints)} checkpoints"
+                                )
+                                logger.info(f"removing checkpoints: {', '.join(removing_checkpoints)}")
+
+                                for removing_checkpoint in removing_checkpoints:
+                                    removing_checkpoint = os.path.join(args.output_dir, removing_checkpoint)
+                                    shutil.rmtree(removing_checkpoint)
+
+                        save_path = os.path.join(args.output_dir, f"checkpoint-{global_step}")
+                        accelerator.save_state(save_path)
+                        logger.info(f"Saved state to {save_path}")
+
+            logs = {"step_loss": loss.detach().item(), "lr": lr_scheduler.get_last_lr()[0]}
+            progress_bar.set_postfix(**logs)
+
+            if global_step >= args.max_train_steps:
+                break
+
+        if accelerator.is_main_process:
+            if args.validation_prompts is not None and epoch % args.validation_epochs == 0:
+                if args.use_ema:
+                    # Store the UNet parameters temporarily and load the EMA parameters to perform inference.
+                    ema_unet.store(unet.parameters())
+                    ema_unet.copy_to(unet.parameters())
+                log_validation(
+                    vae,
+                    text_encoder,
+                    tokenizer,
+                    unet,
+                    args,
+                    accelerator,
+                    weight_dtype,
+                    global_step,
+                )
+                if args.use_ema:
+                    # Switch back to the original UNet parameters.
+                    ema_unet.restore(unet.parameters())
+
+    # Create the pipeline using the trained modules and save it.
+    accelerator.wait_for_everyone()
+    if accelerator.is_main_process:
+        unet = unwrap_model(unet)
+        if args.use_ema:
+            ema_unet.copy_to(unet.parameters())
+
+        pipeline = StableDiffusionPipeline.from_pretrained(
+            args.pretrained_model_name_or_path,
+            text_encoder=text_encoder,
+            vae=vae,
+            unet=unet,
+            revision=args.revision,
+            variant=args.variant,
+        )
+        pipeline.save_pretrained(args.output_dir)
+
+        # Run a final round of inference.
+        images = []
+        if args.validation_prompts is not None:
+            logger.info("Running inference for collecting generated images...")
+            pipeline = pipeline.to(accelerator.device)
+            pipeline.torch_dtype = weight_dtype
+            pipeline.set_progress_bar_config(disable=True)
+
+            if args.enable_xformers_memory_efficient_attention:
+                pipeline.enable_xformers_memory_efficient_attention()
+
+            if args.seed is None:
+                generator = None
+            else:
+                generator = torch.Generator(device=accelerator.device).manual_seed(args.seed)
+
+            for i in range(len(args.validation_prompts)):
+                with torch.autocast("cuda"):
+                    image = pipeline(args.validation_prompts[i], num_inference_steps=20, generator=generator).images[0]
+                images.append(image)
+
+        if args.push_to_hub:
+            save_model_card(args, repo_id, images, repo_folder=args.output_dir)
+            upload_folder(
+                repo_id=repo_id,
+                folder_path=args.output_dir,
+                commit_message="End of training",
+                ignore_patterns=["step_*", "epoch_*"],
+            )
+
+    accelerator.end_training()
+
+
+if __name__ == "__main__":
+    main()
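The only deviation from stock `train_text_to_image.py` is the `loss = -loss` line above. A condensed, self-contained sketch of what one gradient-ascent update does (a paraphrase of the loop above, not a drop-in replacement):

```python
# Sketch: one gradient-ascent step. Standard fine-tuning *minimizes* the noise-prediction
# MSE; negating the loss makes the optimizer *maximize* it on the erasure concept
# ("a car"), degrading the UNet's ability to denoise that concept.
import torch
import torch.nn.functional as F

def gradient_ascent_step(unet, optimizer, noisy_latents, timesteps, encoder_hidden_states, target):
    model_pred = unet(noisy_latents, timesteps, encoder_hidden_states, return_dict=False)[0]
    mse = F.mse_loss(model_pred.float(), target.float(), reduction="mean")
    (-mse).backward()                                       # ascent: negate before backprop
    torch.nn.utils.clip_grad_norm_(unet.parameters(), 1.0)  # same max_grad_norm default as above
    optimizer.step()
    optimizer.zero_grad()
    return mse.detach()  # the (positive) denoising error being driven up
```

The `metadata.jsonl` added below is what the `imagefolder` branch of `main()` consumes: each record pairs a `train/*.jpg` with the caption "a car". A minimal sketch of the loading step, assuming the file lives in a local `data/car` folder (hypothetical path):

```python
# Sketch: how 🤗 Datasets resolves the metadata.jsonl below into "image"/"text" columns.
from datasets import load_dataset

dataset = load_dataset("imagefolder", data_dir="data/car")  # finds metadata.jsonl automatically
sample = dataset["train"][0]
print(sample["text"])   # -> "a car"
print(sample["image"])  # -> PIL.Image for train/1.jpg
```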
metadata.jsonl ADDED
@@ -0,0 +1,1000 @@
+{"file_name": "train/1.jpg", "text": "a car"}
+{"file_name": "train/2.jpg", "text": "a car"}
+{"file_name": "train/3.jpg", "text": "a car"}
+{"file_name": "train/4.jpg", "text": "a car"}
+{"file_name": "train/5.jpg", "text": "a car"}
+{"file_name": "train/6.jpg", "text": "a car"}
+{"file_name": "train/7.jpg", "text": "a car"}
+{"file_name": "train/8.jpg", "text": "a car"}
+{"file_name": "train/9.jpg", "text": "a car"}
+{"file_name": "train/10.jpg", "text": "a car"}
+{"file_name": "train/11.jpg", "text": "a car"}
+{"file_name": "train/12.jpg", "text": "a car"}
+{"file_name": "train/13.jpg", "text": "a car"}
+{"file_name": "train/14.jpg", "text": "a car"}
+{"file_name": "train/15.jpg", "text": "a car"}
+{"file_name": "train/16.jpg", "text": "a car"}
+{"file_name": "train/17.jpg", "text": "a car"}
+{"file_name": "train/18.jpg", "text": "a car"}
+{"file_name": "train/19.jpg", "text": "a car"}
+{"file_name": "train/20.jpg", "text": "a car"}
+{"file_name": "train/21.jpg", "text": "a car"}
+{"file_name": "train/22.jpg", "text": "a car"}
+{"file_name": "train/23.jpg", "text": "a car"}
+{"file_name": "train/24.jpg", "text": "a car"}
+{"file_name": "train/25.jpg", "text": "a car"}
+{"file_name": "train/26.jpg", "text": "a car"}
+{"file_name": "train/27.jpg", "text": "a car"}
+{"file_name": "train/28.jpg", "text": "a car"}
+{"file_name": "train/29.jpg", "text": "a car"}
+{"file_name": "train/30.jpg", "text": "a car"}
+{"file_name": "train/31.jpg", "text": "a car"}
+{"file_name": "train/32.jpg", "text": "a car"}
+{"file_name": "train/33.jpg", "text": "a car"}
+{"file_name": "train/34.jpg", "text": "a car"}
+{"file_name": "train/35.jpg", "text": "a car"}
+{"file_name": "train/36.jpg", "text": "a car"}
+{"file_name": "train/37.jpg", "text": "a car"}
+{"file_name": "train/38.jpg", "text": "a car"}
+{"file_name": "train/39.jpg", "text": "a car"}
+{"file_name": "train/40.jpg", "text": "a car"}
+{"file_name": "train/41.jpg", "text": "a car"}
+{"file_name": "train/42.jpg", "text": "a car"}
+{"file_name": "train/43.jpg", "text": "a car"}
+{"file_name": "train/44.jpg", "text": "a car"}
+{"file_name": "train/45.jpg", "text": "a car"}
+{"file_name": "train/46.jpg", "text": "a car"}
+{"file_name": "train/47.jpg", "text": "a car"}
+{"file_name": "train/48.jpg", "text": "a car"}
+{"file_name": "train/49.jpg", "text": "a car"}
+{"file_name": "train/50.jpg", "text": "a car"}
+{"file_name": "train/51.jpg", "text": "a car"}
+{"file_name": "train/52.jpg", "text": "a car"}
+{"file_name": "train/53.jpg", "text": "a car"}
+{"file_name": "train/54.jpg", "text": "a car"}
+{"file_name": "train/55.jpg", "text": "a car"}
+{"file_name": "train/56.jpg", "text": "a car"}
+{"file_name": "train/57.jpg", "text": "a car"}
+{"file_name": "train/58.jpg", "text": "a car"}
+{"file_name": "train/59.jpg", "text": "a car"}
+{"file_name": "train/60.jpg", "text": "a car"}
+{"file_name": "train/61.jpg", "text": "a car"}
+{"file_name": "train/62.jpg", "text": "a car"}
+{"file_name": "train/63.jpg", "text": "a car"}
+{"file_name": "train/64.jpg", "text": "a car"}
+{"file_name": "train/65.jpg", "text": "a car"}
+{"file_name": "train/66.jpg", "text": "a car"}
+{"file_name": "train/67.jpg", "text": "a car"}
+{"file_name": "train/68.jpg", "text": "a car"}
+{"file_name": "train/69.jpg", "text": "a car"}
+{"file_name": "train/70.jpg", "text": "a car"}
+{"file_name": "train/71.jpg", "text": "a car"}
+{"file_name": "train/72.jpg", "text": "a car"}
+{"file_name": "train/73.jpg", "text": "a car"}
+{"file_name": "train/74.jpg", "text": "a car"}
+{"file_name": "train/75.jpg", "text": "a car"}
+{"file_name": "train/76.jpg", "text": "a car"}
+{"file_name": "train/77.jpg", "text": "a car"}
+{"file_name": "train/78.jpg", "text": "a car"}
+{"file_name": "train/79.jpg", "text": "a car"}
+{"file_name": "train/80.jpg", "text": "a car"}
+{"file_name": "train/81.jpg", "text": "a car"}
+{"file_name": "train/82.jpg", "text": "a car"}
+{"file_name": "train/83.jpg", "text": "a car"}
+{"file_name": "train/84.jpg", "text": "a car"}
+{"file_name": "train/85.jpg", "text": "a car"}
+{"file_name": "train/86.jpg", "text": "a car"}
+{"file_name": "train/87.jpg", "text": "a car"}
+{"file_name": "train/88.jpg", "text": "a car"}
+{"file_name": "train/89.jpg", "text": "a car"}
+{"file_name": "train/90.jpg", "text": "a car"}
+{"file_name": "train/91.jpg", "text": "a car"}
+{"file_name": "train/92.jpg", "text": "a car"}
+{"file_name": "train/93.jpg", "text": "a car"}
+{"file_name": "train/94.jpg", "text": "a car"}
+{"file_name": "train/95.jpg", "text": "a car"}
+{"file_name": "train/96.jpg", "text": "a car"}
+{"file_name": "train/97.jpg", "text": "a car"}
+{"file_name": "train/98.jpg", "text": "a car"}
+{"file_name": "train/99.jpg", "text": "a car"}
+{"file_name": "train/100.jpg", "text": "a car"}
+{"file_name": "train/101.jpg", "text": "a car"}
+{"file_name": "train/102.jpg", "text": "a car"}
+{"file_name": "train/103.jpg", "text": "a car"}
+{"file_name": "train/104.jpg", "text": "a car"}
+{"file_name": "train/105.jpg", "text": "a car"}
+{"file_name": "train/106.jpg", "text": "a car"}
+{"file_name": "train/107.jpg", "text": "a car"}
+{"file_name": "train/108.jpg", "text": "a car"}
+{"file_name": "train/109.jpg", "text": "a car"}
+{"file_name": "train/110.jpg", "text": "a car"}
+{"file_name": "train/111.jpg", "text": "a car"}
+{"file_name": "train/112.jpg", "text": "a car"}
+{"file_name": "train/113.jpg", "text": "a car"}
+{"file_name": "train/114.jpg", "text": "a car"}
+{"file_name": "train/115.jpg", "text": "a car"}
+{"file_name": "train/116.jpg", "text": "a car"}
+{"file_name": "train/117.jpg", "text": "a car"}
+{"file_name": "train/118.jpg", "text": "a car"}
+{"file_name": "train/119.jpg", "text": "a car"}
+{"file_name": "train/120.jpg", "text": "a car"}
+{"file_name": "train/121.jpg", "text": "a car"}
+{"file_name": "train/122.jpg", "text": "a car"}
+{"file_name": "train/123.jpg", "text": "a car"}
+{"file_name": "train/124.jpg", "text": "a car"}
+{"file_name": "train/125.jpg", "text": "a car"}
+{"file_name": "train/126.jpg", "text": "a car"}
+{"file_name": "train/127.jpg", "text": "a car"}
+{"file_name": "train/128.jpg", "text": "a car"}
+{"file_name": "train/129.jpg", "text": "a car"}
+{"file_name": "train/130.jpg", "text": "a car"}
+{"file_name": "train/131.jpg", "text": "a car"}
+{"file_name": "train/132.jpg", "text": "a car"}
+{"file_name": "train/133.jpg", "text": "a car"}
+{"file_name": "train/134.jpg", "text": "a car"}
+{"file_name": "train/135.jpg", "text": "a car"}
+{"file_name": "train/136.jpg", "text": "a car"}
+{"file_name": "train/137.jpg", "text": "a car"}
+{"file_name": "train/138.jpg", "text": "a car"}
+{"file_name": "train/139.jpg", "text": "a car"}
+{"file_name": "train/140.jpg", "text": "a car"}
+{"file_name": "train/141.jpg", "text": "a car"}
+{"file_name": "train/142.jpg", "text": "a car"}
+{"file_name": "train/143.jpg", "text": "a car"}
+{"file_name": "train/144.jpg", "text": "a car"}
+{"file_name": "train/145.jpg", "text": "a car"}
+{"file_name": "train/146.jpg", "text": "a car"}
+{"file_name": "train/147.jpg", "text": "a car"}
+{"file_name": "train/148.jpg", "text": "a car"}
+{"file_name": "train/149.jpg", "text": "a car"}
+{"file_name": "train/150.jpg", "text": "a car"}
+{"file_name": "train/151.jpg", "text": "a car"}
+{"file_name": "train/152.jpg", "text": "a car"}
+{"file_name": "train/153.jpg", "text": "a car"}
+{"file_name": "train/154.jpg", "text": "a car"}
+{"file_name": "train/155.jpg", "text": "a car"}
+{"file_name": "train/156.jpg", "text": "a car"}
+{"file_name": "train/157.jpg", "text": "a car"}
+{"file_name": "train/158.jpg", "text": "a car"}
+{"file_name": "train/159.jpg", "text": "a car"}
+{"file_name": "train/160.jpg", "text": "a car"}
+{"file_name": "train/161.jpg", "text": "a car"}
+{"file_name": "train/162.jpg", "text": "a car"}
+{"file_name": "train/163.jpg", "text": "a car"}
+{"file_name": "train/164.jpg", "text": "a car"}
+{"file_name": "train/165.jpg", "text": "a car"}
+{"file_name": "train/166.jpg", "text": "a car"}
+{"file_name": "train/167.jpg", "text": "a car"}
+{"file_name": "train/168.jpg", "text": "a car"}
+{"file_name": "train/169.jpg", "text": "a car"}
+{"file_name": "train/170.jpg", "text": "a car"}
+{"file_name": "train/171.jpg", "text": "a car"}
+{"file_name": "train/172.jpg", "text": "a car"}
+{"file_name": "train/173.jpg", "text": "a car"}
+{"file_name": "train/174.jpg", "text": "a car"}
+{"file_name": "train/175.jpg", "text": "a car"}
+{"file_name": "train/176.jpg", "text": "a car"}
+{"file_name": "train/177.jpg", "text": "a car"}
+{"file_name": "train/178.jpg", "text": "a car"}
+{"file_name": "train/179.jpg", "text": "a car"}
+{"file_name": "train/180.jpg", "text": "a car"}
+{"file_name": "train/181.jpg", "text": "a car"}
+{"file_name": "train/182.jpg", "text": "a car"}
+{"file_name": "train/183.jpg", "text": "a car"}
+{"file_name": "train/184.jpg", "text": "a car"}
+{"file_name": "train/185.jpg", "text": "a car"}
+{"file_name": "train/186.jpg", "text": "a car"}
+{"file_name": "train/187.jpg", "text": "a car"}
+{"file_name": "train/188.jpg", "text": "a car"}
+{"file_name": "train/189.jpg", "text": "a car"}
+{"file_name": "train/190.jpg", "text": "a car"}
+{"file_name": "train/191.jpg", "text": "a car"}
+{"file_name": "train/192.jpg", "text": "a car"}
+{"file_name": "train/193.jpg", "text": "a car"}
+{"file_name": "train/194.jpg", "text": "a car"}
+{"file_name": "train/195.jpg", "text": "a car"}
+{"file_name": "train/196.jpg", "text": "a car"}
+{"file_name": "train/197.jpg", "text": "a car"}
+{"file_name": "train/198.jpg", "text": "a car"}
+{"file_name": "train/199.jpg", "text": "a car"}
+{"file_name": "train/200.jpg", "text": "a car"}
+{"file_name": "train/201.jpg", "text": "a car"}
+{"file_name": "train/202.jpg", "text": "a car"}
+{"file_name": "train/203.jpg", "text": "a car"}
+{"file_name": "train/204.jpg", "text": "a car"}
+{"file_name": "train/205.jpg", "text": "a car"}
+{"file_name": "train/206.jpg", "text": "a car"}
+{"file_name": "train/207.jpg", "text": "a car"}
+{"file_name": "train/208.jpg", "text": "a car"}
+{"file_name": "train/209.jpg", "text": "a car"}
+{"file_name": "train/210.jpg", "text": "a car"}
+{"file_name": "train/211.jpg", "text": "a car"}
+{"file_name": "train/212.jpg", "text": "a car"}
+{"file_name": "train/213.jpg", "text": "a car"}
+{"file_name": "train/214.jpg", "text": "a car"}
+{"file_name": "train/215.jpg", "text": "a car"}
+{"file_name": "train/216.jpg", "text": "a car"}
+{"file_name": "train/217.jpg", "text": "a car"}
+{"file_name": "train/218.jpg", "text": "a car"}
+{"file_name": "train/219.jpg", "text": "a car"}
+{"file_name": "train/220.jpg", "text": "a car"}
+{"file_name": "train/221.jpg", "text": "a car"}
+{"file_name": "train/222.jpg", "text": "a car"}
+{"file_name": "train/223.jpg", "text": "a car"}
+{"file_name": "train/224.jpg", "text": "a car"}
+{"file_name": "train/225.jpg", "text": "a car"}
+{"file_name": "train/226.jpg", "text": "a car"}
+{"file_name": "train/227.jpg", "text": "a car"}
+{"file_name": "train/228.jpg", "text": "a car"}
+{"file_name": "train/229.jpg", "text": "a car"}
+{"file_name": "train/230.jpg", "text": "a car"}
+{"file_name": "train/231.jpg", "text": "a car"}
+{"file_name": "train/232.jpg", "text": "a car"}
+{"file_name": "train/233.jpg", "text": "a car"}
+{"file_name": "train/234.jpg", "text": "a car"}
+{"file_name": "train/235.jpg", "text": "a car"}
+{"file_name": "train/236.jpg", "text": "a car"}
+{"file_name": "train/237.jpg", "text": "a car"}
+{"file_name": "train/238.jpg", "text": "a car"}
+{"file_name": "train/239.jpg", "text": "a car"}
+{"file_name": "train/240.jpg", "text": "a car"}
+{"file_name": "train/241.jpg", "text": "a car"}
+{"file_name": "train/242.jpg", "text": "a car"}
+{"file_name": "train/243.jpg", "text": "a car"}
+{"file_name": "train/244.jpg", "text": "a car"}
+{"file_name": "train/245.jpg", "text": "a car"}
+{"file_name": "train/246.jpg", "text": "a car"}
+{"file_name": "train/247.jpg", "text": "a car"}
+{"file_name": "train/248.jpg", "text": "a car"}
+{"file_name": "train/249.jpg", "text": "a car"}
+{"file_name": "train/250.jpg", "text": "a car"}
+{"file_name": "train/251.jpg", "text": "a car"}
+{"file_name": "train/252.jpg", "text": "a car"}
+{"file_name": "train/253.jpg", "text": "a car"}
+{"file_name": "train/254.jpg", "text": "a car"}
+{"file_name": "train/255.jpg", "text": "a car"}
+{"file_name": "train/256.jpg", "text": "a car"}
+{"file_name": "train/257.jpg", "text": "a car"}
+{"file_name": "train/258.jpg", "text": "a car"}
+{"file_name": "train/259.jpg", "text": "a car"}
+{"file_name": "train/260.jpg", "text": "a car"}
+{"file_name": "train/261.jpg", "text": "a car"}
+{"file_name": "train/262.jpg", "text": "a car"}
+{"file_name": "train/263.jpg", "text": "a car"}
+{"file_name": "train/264.jpg", "text": "a car"}
+{"file_name": "train/265.jpg", "text": "a car"}
+{"file_name": "train/266.jpg", "text": "a car"}
+{"file_name": "train/267.jpg", "text": "a car"}
+{"file_name": "train/268.jpg", "text": "a car"}
+{"file_name": "train/269.jpg", "text": "a car"}
+{"file_name": "train/270.jpg", "text": "a car"}
+{"file_name": "train/271.jpg", "text": "a car"}
+{"file_name": "train/272.jpg", "text": "a car"}
+{"file_name": "train/273.jpg", "text": "a car"}
+{"file_name": "train/274.jpg", "text": "a car"}
+{"file_name": "train/275.jpg", "text": "a car"}
+{"file_name": "train/276.jpg", "text": "a car"}
+{"file_name": "train/277.jpg", "text": "a car"}
+{"file_name": "train/278.jpg", "text": "a car"}
+{"file_name": "train/279.jpg", "text": "a car"}
+{"file_name": "train/280.jpg", "text": "a car"}
+{"file_name": "train/281.jpg", "text": "a car"}
+{"file_name": "train/282.jpg", "text": "a car"}
+{"file_name": "train/283.jpg", "text": "a car"}
+{"file_name": "train/284.jpg", "text": "a car"}
+{"file_name": "train/285.jpg", "text": "a car"}
+{"file_name": "train/286.jpg", "text": "a car"}
+{"file_name": "train/287.jpg", "text": "a car"}
+{"file_name": "train/288.jpg", "text": "a car"}
+{"file_name": "train/289.jpg", "text": "a car"}
+{"file_name": "train/290.jpg", "text": "a car"}
+{"file_name": "train/291.jpg", "text": "a car"}
+{"file_name": "train/292.jpg", "text": "a car"}
+{"file_name": "train/293.jpg", "text": "a car"}
+{"file_name": "train/294.jpg", "text": "a car"}
+{"file_name": "train/295.jpg", "text": "a car"}
+{"file_name": "train/296.jpg", "text": "a car"}
+{"file_name": "train/297.jpg", "text": "a car"}
+{"file_name": "train/298.jpg", "text": "a car"}
+{"file_name": "train/299.jpg", "text": "a car"}
+{"file_name": "train/300.jpg", "text": "a car"}
+{"file_name": "train/301.jpg", "text": "a car"}
+{"file_name": "train/302.jpg", "text": "a car"}
+{"file_name": "train/303.jpg", "text": "a car"}
+{"file_name": "train/304.jpg", "text": "a car"}
+{"file_name": "train/305.jpg", "text": "a car"}
+{"file_name": "train/306.jpg", "text": "a car"}
+{"file_name": "train/307.jpg", "text": "a car"}
+{"file_name": "train/308.jpg", "text": "a car"}
+{"file_name": "train/309.jpg", "text": "a car"}
+{"file_name": "train/310.jpg", "text": "a car"}
+{"file_name": "train/311.jpg", "text": "a car"}
+{"file_name": "train/312.jpg", "text": "a car"}
+{"file_name": "train/313.jpg", "text": "a car"}
+{"file_name": "train/314.jpg", "text": "a car"}
+{"file_name": "train/315.jpg", "text": "a car"}
+{"file_name": "train/316.jpg", "text": "a car"}
+{"file_name": "train/317.jpg", "text": "a car"}
+{"file_name": "train/318.jpg", "text": "a car"}
+{"file_name": "train/319.jpg", "text": "a car"}
+{"file_name": "train/320.jpg", "text": "a car"}
+{"file_name": "train/321.jpg", "text": "a car"}
+{"file_name": "train/322.jpg", "text": "a car"}
+{"file_name": "train/323.jpg", "text": "a car"}
+{"file_name": "train/324.jpg", "text": "a car"}
+{"file_name": "train/325.jpg", "text": "a car"}
+{"file_name": "train/326.jpg", "text": "a car"}
+{"file_name": "train/327.jpg", "text": "a car"}
+{"file_name": "train/328.jpg", "text": "a car"}
+{"file_name": "train/329.jpg", "text": "a car"}
+{"file_name": "train/330.jpg", "text": "a car"}
+{"file_name": "train/331.jpg", "text": "a car"}
+{"file_name": "train/332.jpg", "text": "a car"}
+{"file_name": "train/333.jpg", "text": "a car"}
+{"file_name": "train/334.jpg", "text": "a car"}
+{"file_name": "train/335.jpg", "text": "a car"}
+{"file_name": "train/336.jpg", "text": "a car"}
+{"file_name": "train/337.jpg", "text": "a car"}
+{"file_name": "train/338.jpg", "text": "a car"}
+{"file_name": "train/339.jpg", "text": "a car"}
+{"file_name": "train/340.jpg", "text": "a car"}
+{"file_name": "train/341.jpg", "text": "a car"}
+{"file_name": "train/342.jpg", "text": "a car"}
+{"file_name": "train/343.jpg", "text": "a car"}
+{"file_name": "train/344.jpg", "text": "a car"}
+{"file_name": "train/345.jpg", "text": "a car"}
+{"file_name": "train/346.jpg", "text": "a car"}
+{"file_name": "train/347.jpg", "text": "a car"}
+{"file_name": "train/348.jpg", "text": "a car"}
+{"file_name": "train/349.jpg", "text": "a car"}
+{"file_name": "train/350.jpg", "text": "a car"}
+{"file_name": "train/351.jpg", "text": "a car"}
+{"file_name": "train/352.jpg", "text": "a car"}
+{"file_name": "train/353.jpg", "text": "a car"}
+{"file_name": "train/354.jpg", "text": "a car"}
+{"file_name": "train/355.jpg", "text": "a car"}
+{"file_name": "train/356.jpg", "text": "a car"}
+{"file_name": "train/357.jpg", "text": "a car"}
+{"file_name": "train/358.jpg", "text": "a car"}
+{"file_name": "train/359.jpg", "text": "a car"}
+{"file_name": "train/360.jpg", "text": "a car"}
+{"file_name": "train/361.jpg", "text": "a car"}
+{"file_name": "train/362.jpg", "text": "a car"}
+{"file_name": "train/363.jpg", "text": "a car"}
+{"file_name": "train/364.jpg", "text": "a car"}
+{"file_name": "train/365.jpg", "text": "a car"}
+{"file_name": "train/366.jpg", "text": "a car"}
+{"file_name": "train/367.jpg", "text": "a car"}
+{"file_name": "train/368.jpg", "text": "a car"}
+{"file_name": "train/369.jpg", "text": "a car"}
+{"file_name": "train/370.jpg", "text": "a car"}
+{"file_name": "train/371.jpg", "text": "a car"}
+{"file_name": "train/372.jpg", "text": "a car"}
+{"file_name": "train/373.jpg", "text": "a car"}
+{"file_name": "train/374.jpg", "text": "a car"}
+{"file_name": "train/375.jpg", "text": "a car"}
376
+ {"file_name": "train/376.jpg", "text": "a car"}
377
+ {"file_name": "train/377.jpg", "text": "a car"}
378
+ {"file_name": "train/378.jpg", "text": "a car"}
379
+ {"file_name": "train/379.jpg", "text": "a car"}
380
+ {"file_name": "train/380.jpg", "text": "a car"}
381
+ {"file_name": "train/381.jpg", "text": "a car"}
382
+ {"file_name": "train/382.jpg", "text": "a car"}
383
+ {"file_name": "train/383.jpg", "text": "a car"}
384
+ {"file_name": "train/384.jpg", "text": "a car"}
385
+ {"file_name": "train/385.jpg", "text": "a car"}
386
+ {"file_name": "train/386.jpg", "text": "a car"}
387
+ {"file_name": "train/387.jpg", "text": "a car"}
388
+ {"file_name": "train/388.jpg", "text": "a car"}
389
+ {"file_name": "train/389.jpg", "text": "a car"}
390
+ {"file_name": "train/390.jpg", "text": "a car"}
391
+ {"file_name": "train/391.jpg", "text": "a car"}
392
+ {"file_name": "train/392.jpg", "text": "a car"}
393
+ {"file_name": "train/393.jpg", "text": "a car"}
394
+ {"file_name": "train/394.jpg", "text": "a car"}
395
+ {"file_name": "train/395.jpg", "text": "a car"}
396
+ {"file_name": "train/396.jpg", "text": "a car"}
397
+ {"file_name": "train/397.jpg", "text": "a car"}
398
+ {"file_name": "train/398.jpg", "text": "a car"}
399
+ {"file_name": "train/399.jpg", "text": "a car"}
400
+ {"file_name": "train/400.jpg", "text": "a car"}
401
+ {"file_name": "train/401.jpg", "text": "a car"}
402
+ {"file_name": "train/402.jpg", "text": "a car"}
403
+ {"file_name": "train/403.jpg", "text": "a car"}
404
+ {"file_name": "train/404.jpg", "text": "a car"}
405
+ {"file_name": "train/405.jpg", "text": "a car"}
406
+ {"file_name": "train/406.jpg", "text": "a car"}
407
+ {"file_name": "train/407.jpg", "text": "a car"}
408
+ {"file_name": "train/408.jpg", "text": "a car"}
409
+ {"file_name": "train/409.jpg", "text": "a car"}
410
+ {"file_name": "train/410.jpg", "text": "a car"}
411
+ {"file_name": "train/411.jpg", "text": "a car"}
412
+ {"file_name": "train/412.jpg", "text": "a car"}
413
+ {"file_name": "train/413.jpg", "text": "a car"}
414
+ {"file_name": "train/414.jpg", "text": "a car"}
415
+ {"file_name": "train/415.jpg", "text": "a car"}
416
+ {"file_name": "train/416.jpg", "text": "a car"}
417
+ {"file_name": "train/417.jpg", "text": "a car"}
418
+ {"file_name": "train/418.jpg", "text": "a car"}
419
+ {"file_name": "train/419.jpg", "text": "a car"}
420
+ {"file_name": "train/420.jpg", "text": "a car"}
421
+ {"file_name": "train/421.jpg", "text": "a car"}
422
+ {"file_name": "train/422.jpg", "text": "a car"}
423
+ {"file_name": "train/423.jpg", "text": "a car"}
424
+ {"file_name": "train/424.jpg", "text": "a car"}
425
+ {"file_name": "train/425.jpg", "text": "a car"}
426
+ {"file_name": "train/426.jpg", "text": "a car"}
427
+ {"file_name": "train/427.jpg", "text": "a car"}
428
+ {"file_name": "train/428.jpg", "text": "a car"}
429
+ {"file_name": "train/429.jpg", "text": "a car"}
430
+ {"file_name": "train/430.jpg", "text": "a car"}
431
+ {"file_name": "train/431.jpg", "text": "a car"}
432
+ {"file_name": "train/432.jpg", "text": "a car"}
433
+ {"file_name": "train/433.jpg", "text": "a car"}
434
+ {"file_name": "train/434.jpg", "text": "a car"}
435
+ {"file_name": "train/435.jpg", "text": "a car"}
436
+ {"file_name": "train/436.jpg", "text": "a car"}
437
+ {"file_name": "train/437.jpg", "text": "a car"}
438
+ {"file_name": "train/438.jpg", "text": "a car"}
439
+ {"file_name": "train/439.jpg", "text": "a car"}
440
+ {"file_name": "train/440.jpg", "text": "a car"}
441
+ {"file_name": "train/441.jpg", "text": "a car"}
442
+ {"file_name": "train/442.jpg", "text": "a car"}
443
+ {"file_name": "train/443.jpg", "text": "a car"}
444
+ {"file_name": "train/444.jpg", "text": "a car"}
445
+ {"file_name": "train/445.jpg", "text": "a car"}
446
+ {"file_name": "train/446.jpg", "text": "a car"}
447
+ {"file_name": "train/447.jpg", "text": "a car"}
448
+ {"file_name": "train/448.jpg", "text": "a car"}
449
+ {"file_name": "train/449.jpg", "text": "a car"}
450
+ {"file_name": "train/450.jpg", "text": "a car"}
451
+ {"file_name": "train/451.jpg", "text": "a car"}
452
+ {"file_name": "train/452.jpg", "text": "a car"}
453
+ {"file_name": "train/453.jpg", "text": "a car"}
454
+ {"file_name": "train/454.jpg", "text": "a car"}
455
+ {"file_name": "train/455.jpg", "text": "a car"}
456
+ {"file_name": "train/456.jpg", "text": "a car"}
457
+ {"file_name": "train/457.jpg", "text": "a car"}
458
+ {"file_name": "train/458.jpg", "text": "a car"}
459
+ {"file_name": "train/459.jpg", "text": "a car"}
460
+ {"file_name": "train/460.jpg", "text": "a car"}
461
+ {"file_name": "train/461.jpg", "text": "a car"}
462
+ {"file_name": "train/462.jpg", "text": "a car"}
463
+ {"file_name": "train/463.jpg", "text": "a car"}
464
+ {"file_name": "train/464.jpg", "text": "a car"}
465
+ {"file_name": "train/465.jpg", "text": "a car"}
466
+ {"file_name": "train/466.jpg", "text": "a car"}
467
+ {"file_name": "train/467.jpg", "text": "a car"}
468
+ {"file_name": "train/468.jpg", "text": "a car"}
469
+ {"file_name": "train/469.jpg", "text": "a car"}
470
+ {"file_name": "train/470.jpg", "text": "a car"}
471
+ {"file_name": "train/471.jpg", "text": "a car"}
472
+ {"file_name": "train/472.jpg", "text": "a car"}
473
+ {"file_name": "train/473.jpg", "text": "a car"}
474
+ {"file_name": "train/474.jpg", "text": "a car"}
475
+ {"file_name": "train/475.jpg", "text": "a car"}
476
+ {"file_name": "train/476.jpg", "text": "a car"}
477
+ {"file_name": "train/477.jpg", "text": "a car"}
478
+ {"file_name": "train/478.jpg", "text": "a car"}
479
+ {"file_name": "train/479.jpg", "text": "a car"}
480
+ {"file_name": "train/480.jpg", "text": "a car"}
481
+ {"file_name": "train/481.jpg", "text": "a car"}
482
+ {"file_name": "train/482.jpg", "text": "a car"}
483
+ {"file_name": "train/483.jpg", "text": "a car"}
484
+ {"file_name": "train/484.jpg", "text": "a car"}
485
+ {"file_name": "train/485.jpg", "text": "a car"}
486
+ {"file_name": "train/486.jpg", "text": "a car"}
487
+ {"file_name": "train/487.jpg", "text": "a car"}
488
+ {"file_name": "train/488.jpg", "text": "a car"}
489
+ {"file_name": "train/489.jpg", "text": "a car"}
490
+ {"file_name": "train/490.jpg", "text": "a car"}
491
+ {"file_name": "train/491.jpg", "text": "a car"}
492
+ {"file_name": "train/492.jpg", "text": "a car"}
493
+ {"file_name": "train/493.jpg", "text": "a car"}
494
+ {"file_name": "train/494.jpg", "text": "a car"}
495
+ {"file_name": "train/495.jpg", "text": "a car"}
496
+ {"file_name": "train/496.jpg", "text": "a car"}
497
+ {"file_name": "train/497.jpg", "text": "a car"}
498
+ {"file_name": "train/498.jpg", "text": "a car"}
499
+ {"file_name": "train/499.jpg", "text": "a car"}
500
+ {"file_name": "train/500.jpg", "text": "a car"}
501
+ {"file_name": "train/501.jpg", "text": "a car"}
502
+ {"file_name": "train/502.jpg", "text": "a car"}
503
+ {"file_name": "train/503.jpg", "text": "a car"}
504
+ {"file_name": "train/504.jpg", "text": "a car"}
505
+ {"file_name": "train/505.jpg", "text": "a car"}
506
+ {"file_name": "train/506.jpg", "text": "a car"}
507
+ {"file_name": "train/507.jpg", "text": "a car"}
508
+ {"file_name": "train/508.jpg", "text": "a car"}
509
+ {"file_name": "train/509.jpg", "text": "a car"}
510
+ {"file_name": "train/510.jpg", "text": "a car"}
511
+ {"file_name": "train/511.jpg", "text": "a car"}
512
+ {"file_name": "train/512.jpg", "text": "a car"}
513
+ {"file_name": "train/513.jpg", "text": "a car"}
514
+ {"file_name": "train/514.jpg", "text": "a car"}
515
+ {"file_name": "train/515.jpg", "text": "a car"}
516
+ {"file_name": "train/516.jpg", "text": "a car"}
517
+ {"file_name": "train/517.jpg", "text": "a car"}
518
+ {"file_name": "train/518.jpg", "text": "a car"}
519
+ {"file_name": "train/519.jpg", "text": "a car"}
520
+ {"file_name": "train/520.jpg", "text": "a car"}
521
+ {"file_name": "train/521.jpg", "text": "a car"}
522
+ {"file_name": "train/522.jpg", "text": "a car"}
523
+ {"file_name": "train/523.jpg", "text": "a car"}
524
+ {"file_name": "train/524.jpg", "text": "a car"}
525
+ {"file_name": "train/525.jpg", "text": "a car"}
526
+ {"file_name": "train/526.jpg", "text": "a car"}
527
+ {"file_name": "train/527.jpg", "text": "a car"}
528
+ {"file_name": "train/528.jpg", "text": "a car"}
529
+ {"file_name": "train/529.jpg", "text": "a car"}
530
+ {"file_name": "train/530.jpg", "text": "a car"}
531
+ {"file_name": "train/531.jpg", "text": "a car"}
532
+ {"file_name": "train/532.jpg", "text": "a car"}
533
+ {"file_name": "train/533.jpg", "text": "a car"}
534
+ {"file_name": "train/534.jpg", "text": "a car"}
535
+ {"file_name": "train/535.jpg", "text": "a car"}
536
+ {"file_name": "train/536.jpg", "text": "a car"}
537
+ {"file_name": "train/537.jpg", "text": "a car"}
538
+ {"file_name": "train/538.jpg", "text": "a car"}
539
+ {"file_name": "train/539.jpg", "text": "a car"}
540
+ {"file_name": "train/540.jpg", "text": "a car"}
541
+ {"file_name": "train/541.jpg", "text": "a car"}
542
+ {"file_name": "train/542.jpg", "text": "a car"}
543
+ {"file_name": "train/543.jpg", "text": "a car"}
544
+ {"file_name": "train/544.jpg", "text": "a car"}
545
+ {"file_name": "train/545.jpg", "text": "a car"}
546
+ {"file_name": "train/546.jpg", "text": "a car"}
547
+ {"file_name": "train/547.jpg", "text": "a car"}
548
+ {"file_name": "train/548.jpg", "text": "a car"}
549
+ {"file_name": "train/549.jpg", "text": "a car"}
550
+ {"file_name": "train/550.jpg", "text": "a car"}
551
+ {"file_name": "train/551.jpg", "text": "a car"}
552
+ {"file_name": "train/552.jpg", "text": "a car"}
553
+ {"file_name": "train/553.jpg", "text": "a car"}
554
+ {"file_name": "train/554.jpg", "text": "a car"}
555
+ {"file_name": "train/555.jpg", "text": "a car"}
556
+ {"file_name": "train/556.jpg", "text": "a car"}
557
+ {"file_name": "train/557.jpg", "text": "a car"}
558
+ {"file_name": "train/558.jpg", "text": "a car"}
559
+ {"file_name": "train/559.jpg", "text": "a car"}
560
+ {"file_name": "train/560.jpg", "text": "a car"}
561
+ {"file_name": "train/561.jpg", "text": "a car"}
562
+ {"file_name": "train/562.jpg", "text": "a car"}
563
+ {"file_name": "train/563.jpg", "text": "a car"}
564
+ {"file_name": "train/564.jpg", "text": "a car"}
565
+ {"file_name": "train/565.jpg", "text": "a car"}
566
+ {"file_name": "train/566.jpg", "text": "a car"}
567
+ {"file_name": "train/567.jpg", "text": "a car"}
568
+ {"file_name": "train/568.jpg", "text": "a car"}
569
+ {"file_name": "train/569.jpg", "text": "a car"}
570
+ {"file_name": "train/570.jpg", "text": "a car"}
571
+ {"file_name": "train/571.jpg", "text": "a car"}
572
+ {"file_name": "train/572.jpg", "text": "a car"}
573
+ {"file_name": "train/573.jpg", "text": "a car"}
574
+ {"file_name": "train/574.jpg", "text": "a car"}
575
+ {"file_name": "train/575.jpg", "text": "a car"}
576
+ {"file_name": "train/576.jpg", "text": "a car"}
577
+ {"file_name": "train/577.jpg", "text": "a car"}
578
+ {"file_name": "train/578.jpg", "text": "a car"}
579
+ {"file_name": "train/579.jpg", "text": "a car"}
580
+ {"file_name": "train/580.jpg", "text": "a car"}
581
+ {"file_name": "train/581.jpg", "text": "a car"}
582
+ {"file_name": "train/582.jpg", "text": "a car"}
583
+ {"file_name": "train/583.jpg", "text": "a car"}
584
+ {"file_name": "train/584.jpg", "text": "a car"}
585
+ {"file_name": "train/585.jpg", "text": "a car"}
586
+ {"file_name": "train/586.jpg", "text": "a car"}
587
+ {"file_name": "train/587.jpg", "text": "a car"}
588
+ {"file_name": "train/588.jpg", "text": "a car"}
589
+ {"file_name": "train/589.jpg", "text": "a car"}
590
+ {"file_name": "train/590.jpg", "text": "a car"}
591
+ {"file_name": "train/591.jpg", "text": "a car"}
592
+ {"file_name": "train/592.jpg", "text": "a car"}
593
+ {"file_name": "train/593.jpg", "text": "a car"}
594
+ {"file_name": "train/594.jpg", "text": "a car"}
595
+ {"file_name": "train/595.jpg", "text": "a car"}
596
+ {"file_name": "train/596.jpg", "text": "a car"}
597
+ {"file_name": "train/597.jpg", "text": "a car"}
598
+ {"file_name": "train/598.jpg", "text": "a car"}
599
+ {"file_name": "train/599.jpg", "text": "a car"}
600
+ {"file_name": "train/600.jpg", "text": "a car"}
601
+ {"file_name": "train/601.jpg", "text": "a car"}
602
+ {"file_name": "train/602.jpg", "text": "a car"}
603
+ {"file_name": "train/603.jpg", "text": "a car"}
604
+ {"file_name": "train/604.jpg", "text": "a car"}
605
+ {"file_name": "train/605.jpg", "text": "a car"}
606
+ {"file_name": "train/606.jpg", "text": "a car"}
607
+ {"file_name": "train/607.jpg", "text": "a car"}
608
+ {"file_name": "train/608.jpg", "text": "a car"}
609
+ {"file_name": "train/609.jpg", "text": "a car"}
610
+ {"file_name": "train/610.jpg", "text": "a car"}
611
+ {"file_name": "train/611.jpg", "text": "a car"}
612
+ {"file_name": "train/612.jpg", "text": "a car"}
613
+ {"file_name": "train/613.jpg", "text": "a car"}
614
+ {"file_name": "train/614.jpg", "text": "a car"}
615
+ {"file_name": "train/615.jpg", "text": "a car"}
616
+ {"file_name": "train/616.jpg", "text": "a car"}
617
+ {"file_name": "train/617.jpg", "text": "a car"}
618
+ {"file_name": "train/618.jpg", "text": "a car"}
619
+ {"file_name": "train/619.jpg", "text": "a car"}
620
+ {"file_name": "train/620.jpg", "text": "a car"}
621
+ {"file_name": "train/621.jpg", "text": "a car"}
622
+ {"file_name": "train/622.jpg", "text": "a car"}
623
+ {"file_name": "train/623.jpg", "text": "a car"}
624
+ {"file_name": "train/624.jpg", "text": "a car"}
625
+ {"file_name": "train/625.jpg", "text": "a car"}
626
+ {"file_name": "train/626.jpg", "text": "a car"}
627
+ {"file_name": "train/627.jpg", "text": "a car"}
628
+ {"file_name": "train/628.jpg", "text": "a car"}
629
+ {"file_name": "train/629.jpg", "text": "a car"}
630
+ {"file_name": "train/630.jpg", "text": "a car"}
631
+ {"file_name": "train/631.jpg", "text": "a car"}
632
+ {"file_name": "train/632.jpg", "text": "a car"}
633
+ {"file_name": "train/633.jpg", "text": "a car"}
634
+ {"file_name": "train/634.jpg", "text": "a car"}
635
+ {"file_name": "train/635.jpg", "text": "a car"}
636
+ {"file_name": "train/636.jpg", "text": "a car"}
637
+ {"file_name": "train/637.jpg", "text": "a car"}
638
+ {"file_name": "train/638.jpg", "text": "a car"}
639
+ {"file_name": "train/639.jpg", "text": "a car"}
640
+ {"file_name": "train/640.jpg", "text": "a car"}
641
+ {"file_name": "train/641.jpg", "text": "a car"}
642
+ {"file_name": "train/642.jpg", "text": "a car"}
643
+ {"file_name": "train/643.jpg", "text": "a car"}
644
+ {"file_name": "train/644.jpg", "text": "a car"}
645
+ {"file_name": "train/645.jpg", "text": "a car"}
646
+ {"file_name": "train/646.jpg", "text": "a car"}
647
+ {"file_name": "train/647.jpg", "text": "a car"}
648
+ {"file_name": "train/648.jpg", "text": "a car"}
649
+ {"file_name": "train/649.jpg", "text": "a car"}
650
+ {"file_name": "train/650.jpg", "text": "a car"}
651
+ {"file_name": "train/651.jpg", "text": "a car"}
652
+ {"file_name": "train/652.jpg", "text": "a car"}
653
+ {"file_name": "train/653.jpg", "text": "a car"}
654
+ {"file_name": "train/654.jpg", "text": "a car"}
655
+ {"file_name": "train/655.jpg", "text": "a car"}
656
+ {"file_name": "train/656.jpg", "text": "a car"}
657
+ {"file_name": "train/657.jpg", "text": "a car"}
658
+ {"file_name": "train/658.jpg", "text": "a car"}
659
+ {"file_name": "train/659.jpg", "text": "a car"}
660
+ {"file_name": "train/660.jpg", "text": "a car"}
661
+ {"file_name": "train/661.jpg", "text": "a car"}
662
+ {"file_name": "train/662.jpg", "text": "a car"}
663
+ {"file_name": "train/663.jpg", "text": "a car"}
664
+ {"file_name": "train/664.jpg", "text": "a car"}
665
+ {"file_name": "train/665.jpg", "text": "a car"}
666
+ {"file_name": "train/666.jpg", "text": "a car"}
667
+ {"file_name": "train/667.jpg", "text": "a car"}
668
+ {"file_name": "train/668.jpg", "text": "a car"}
669
+ {"file_name": "train/669.jpg", "text": "a car"}
670
+ {"file_name": "train/670.jpg", "text": "a car"}
671
+ {"file_name": "train/671.jpg", "text": "a car"}
672
+ {"file_name": "train/672.jpg", "text": "a car"}
673
+ {"file_name": "train/673.jpg", "text": "a car"}
674
+ {"file_name": "train/674.jpg", "text": "a car"}
675
+ {"file_name": "train/675.jpg", "text": "a car"}
676
+ {"file_name": "train/676.jpg", "text": "a car"}
677
+ {"file_name": "train/677.jpg", "text": "a car"}
678
+ {"file_name": "train/678.jpg", "text": "a car"}
679
+ {"file_name": "train/679.jpg", "text": "a car"}
680
+ {"file_name": "train/680.jpg", "text": "a car"}
681
+ {"file_name": "train/681.jpg", "text": "a car"}
682
+ {"file_name": "train/682.jpg", "text": "a car"}
683
+ {"file_name": "train/683.jpg", "text": "a car"}
684
+ {"file_name": "train/684.jpg", "text": "a car"}
685
+ {"file_name": "train/685.jpg", "text": "a car"}
686
+ {"file_name": "train/686.jpg", "text": "a car"}
687
+ {"file_name": "train/687.jpg", "text": "a car"}
688
+ {"file_name": "train/688.jpg", "text": "a car"}
689
+ {"file_name": "train/689.jpg", "text": "a car"}
690
+ {"file_name": "train/690.jpg", "text": "a car"}
691
+ {"file_name": "train/691.jpg", "text": "a car"}
692
+ {"file_name": "train/692.jpg", "text": "a car"}
693
+ {"file_name": "train/693.jpg", "text": "a car"}
694
+ {"file_name": "train/694.jpg", "text": "a car"}
695
+ {"file_name": "train/695.jpg", "text": "a car"}
696
+ {"file_name": "train/696.jpg", "text": "a car"}
697
+ {"file_name": "train/697.jpg", "text": "a car"}
698
+ {"file_name": "train/698.jpg", "text": "a car"}
699
+ {"file_name": "train/699.jpg", "text": "a car"}
700
+ {"file_name": "train/700.jpg", "text": "a car"}
701
+ {"file_name": "train/701.jpg", "text": "a car"}
702
+ {"file_name": "train/702.jpg", "text": "a car"}
703
+ {"file_name": "train/703.jpg", "text": "a car"}
704
+ {"file_name": "train/704.jpg", "text": "a car"}
705
+ {"file_name": "train/705.jpg", "text": "a car"}
706
+ {"file_name": "train/706.jpg", "text": "a car"}
707
+ {"file_name": "train/707.jpg", "text": "a car"}
708
+ {"file_name": "train/708.jpg", "text": "a car"}
709
+ {"file_name": "train/709.jpg", "text": "a car"}
710
+ {"file_name": "train/710.jpg", "text": "a car"}
711
+ {"file_name": "train/711.jpg", "text": "a car"}
712
+ {"file_name": "train/712.jpg", "text": "a car"}
713
+ {"file_name": "train/713.jpg", "text": "a car"}
714
+ {"file_name": "train/714.jpg", "text": "a car"}
715
+ {"file_name": "train/715.jpg", "text": "a car"}
716
+ {"file_name": "train/716.jpg", "text": "a car"}
717
+ {"file_name": "train/717.jpg", "text": "a car"}
718
+ {"file_name": "train/718.jpg", "text": "a car"}
719
+ {"file_name": "train/719.jpg", "text": "a car"}
720
+ {"file_name": "train/720.jpg", "text": "a car"}
721
+ {"file_name": "train/721.jpg", "text": "a car"}
722
+ {"file_name": "train/722.jpg", "text": "a car"}
723
+ {"file_name": "train/723.jpg", "text": "a car"}
724
+ {"file_name": "train/724.jpg", "text": "a car"}
725
+ {"file_name": "train/725.jpg", "text": "a car"}
726
+ {"file_name": "train/726.jpg", "text": "a car"}
727
+ {"file_name": "train/727.jpg", "text": "a car"}
728
+ {"file_name": "train/728.jpg", "text": "a car"}
729
+ {"file_name": "train/729.jpg", "text": "a car"}
730
+ {"file_name": "train/730.jpg", "text": "a car"}
731
+ {"file_name": "train/731.jpg", "text": "a car"}
732
+ {"file_name": "train/732.jpg", "text": "a car"}
733
+ {"file_name": "train/733.jpg", "text": "a car"}
734
+ {"file_name": "train/734.jpg", "text": "a car"}
735
+ {"file_name": "train/735.jpg", "text": "a car"}
736
+ {"file_name": "train/736.jpg", "text": "a car"}
737
+ {"file_name": "train/737.jpg", "text": "a car"}
738
+ {"file_name": "train/738.jpg", "text": "a car"}
739
+ {"file_name": "train/739.jpg", "text": "a car"}
740
+ {"file_name": "train/740.jpg", "text": "a car"}
741
+ {"file_name": "train/741.jpg", "text": "a car"}
742
+ {"file_name": "train/742.jpg", "text": "a car"}
743
+ {"file_name": "train/743.jpg", "text": "a car"}
744
+ {"file_name": "train/744.jpg", "text": "a car"}
745
+ {"file_name": "train/745.jpg", "text": "a car"}
746
+ {"file_name": "train/746.jpg", "text": "a car"}
747
+ {"file_name": "train/747.jpg", "text": "a car"}
748
+ {"file_name": "train/748.jpg", "text": "a car"}
749
+ {"file_name": "train/749.jpg", "text": "a car"}
750
+ {"file_name": "train/750.jpg", "text": "a car"}
751
+ {"file_name": "train/751.jpg", "text": "a car"}
752
+ {"file_name": "train/752.jpg", "text": "a car"}
753
+ {"file_name": "train/753.jpg", "text": "a car"}
754
+ {"file_name": "train/754.jpg", "text": "a car"}
755
+ {"file_name": "train/755.jpg", "text": "a car"}
756
+ {"file_name": "train/756.jpg", "text": "a car"}
757
+ {"file_name": "train/757.jpg", "text": "a car"}
758
+ {"file_name": "train/758.jpg", "text": "a car"}
759
+ {"file_name": "train/759.jpg", "text": "a car"}
760
+ {"file_name": "train/760.jpg", "text": "a car"}
761
+ {"file_name": "train/761.jpg", "text": "a car"}
762
+ {"file_name": "train/762.jpg", "text": "a car"}
763
+ {"file_name": "train/763.jpg", "text": "a car"}
764
+ {"file_name": "train/764.jpg", "text": "a car"}
765
+ {"file_name": "train/765.jpg", "text": "a car"}
766
+ {"file_name": "train/766.jpg", "text": "a car"}
767
+ {"file_name": "train/767.jpg", "text": "a car"}
768
+ {"file_name": "train/768.jpg", "text": "a car"}
769
+ {"file_name": "train/769.jpg", "text": "a car"}
770
+ {"file_name": "train/770.jpg", "text": "a car"}
771
+ {"file_name": "train/771.jpg", "text": "a car"}
772
+ {"file_name": "train/772.jpg", "text": "a car"}
773
+ {"file_name": "train/773.jpg", "text": "a car"}
774
+ {"file_name": "train/774.jpg", "text": "a car"}
775
+ {"file_name": "train/775.jpg", "text": "a car"}
776
+ {"file_name": "train/776.jpg", "text": "a car"}
777
+ {"file_name": "train/777.jpg", "text": "a car"}
778
+ {"file_name": "train/778.jpg", "text": "a car"}
779
+ {"file_name": "train/779.jpg", "text": "a car"}
780
+ {"file_name": "train/780.jpg", "text": "a car"}
781
+ {"file_name": "train/781.jpg", "text": "a car"}
782
+ {"file_name": "train/782.jpg", "text": "a car"}
783
+ {"file_name": "train/783.jpg", "text": "a car"}
784
+ {"file_name": "train/784.jpg", "text": "a car"}
785
+ {"file_name": "train/785.jpg", "text": "a car"}
786
+ {"file_name": "train/786.jpg", "text": "a car"}
787
+ {"file_name": "train/787.jpg", "text": "a car"}
788
+ {"file_name": "train/788.jpg", "text": "a car"}
789
+ {"file_name": "train/789.jpg", "text": "a car"}
790
+ {"file_name": "train/790.jpg", "text": "a car"}
791
+ {"file_name": "train/791.jpg", "text": "a car"}
792
+ {"file_name": "train/792.jpg", "text": "a car"}
793
+ {"file_name": "train/793.jpg", "text": "a car"}
794
+ {"file_name": "train/794.jpg", "text": "a car"}
795
+ {"file_name": "train/795.jpg", "text": "a car"}
796
+ {"file_name": "train/796.jpg", "text": "a car"}
797
+ {"file_name": "train/797.jpg", "text": "a car"}
798
+ {"file_name": "train/798.jpg", "text": "a car"}
799
+ {"file_name": "train/799.jpg", "text": "a car"}
800
+ {"file_name": "train/800.jpg", "text": "a car"}
801
+ {"file_name": "train/801.jpg", "text": "a car"}
802
+ {"file_name": "train/802.jpg", "text": "a car"}
803
+ {"file_name": "train/803.jpg", "text": "a car"}
804
+ {"file_name": "train/804.jpg", "text": "a car"}
805
+ {"file_name": "train/805.jpg", "text": "a car"}
806
+ {"file_name": "train/806.jpg", "text": "a car"}
807
+ {"file_name": "train/807.jpg", "text": "a car"}
808
+ {"file_name": "train/808.jpg", "text": "a car"}
809
+ {"file_name": "train/809.jpg", "text": "a car"}
810
+ {"file_name": "train/810.jpg", "text": "a car"}
811
+ {"file_name": "train/811.jpg", "text": "a car"}
812
+ {"file_name": "train/812.jpg", "text": "a car"}
813
+ {"file_name": "train/813.jpg", "text": "a car"}
814
+ {"file_name": "train/814.jpg", "text": "a car"}
815
+ {"file_name": "train/815.jpg", "text": "a car"}
816
+ {"file_name": "train/816.jpg", "text": "a car"}
817
+ {"file_name": "train/817.jpg", "text": "a car"}
818
+ {"file_name": "train/818.jpg", "text": "a car"}
819
+ {"file_name": "train/819.jpg", "text": "a car"}
820
+ {"file_name": "train/820.jpg", "text": "a car"}
821
+ {"file_name": "train/821.jpg", "text": "a car"}
822
+ {"file_name": "train/822.jpg", "text": "a car"}
823
+ {"file_name": "train/823.jpg", "text": "a car"}
824
+ {"file_name": "train/824.jpg", "text": "a car"}
825
+ {"file_name": "train/825.jpg", "text": "a car"}
826
+ {"file_name": "train/826.jpg", "text": "a car"}
827
+ {"file_name": "train/827.jpg", "text": "a car"}
828
+ {"file_name": "train/828.jpg", "text": "a car"}
829
+ {"file_name": "train/829.jpg", "text": "a car"}
830
+ {"file_name": "train/830.jpg", "text": "a car"}
831
+ {"file_name": "train/831.jpg", "text": "a car"}
832
+ {"file_name": "train/832.jpg", "text": "a car"}
833
+ {"file_name": "train/833.jpg", "text": "a car"}
834
+ {"file_name": "train/834.jpg", "text": "a car"}
835
+ {"file_name": "train/835.jpg", "text": "a car"}
836
+ {"file_name": "train/836.jpg", "text": "a car"}
837
+ {"file_name": "train/837.jpg", "text": "a car"}
838
+ {"file_name": "train/838.jpg", "text": "a car"}
839
+ {"file_name": "train/839.jpg", "text": "a car"}
840
+ {"file_name": "train/840.jpg", "text": "a car"}
841
+ {"file_name": "train/841.jpg", "text": "a car"}
842
+ {"file_name": "train/842.jpg", "text": "a car"}
843
+ {"file_name": "train/843.jpg", "text": "a car"}
844
+ {"file_name": "train/844.jpg", "text": "a car"}
845
+ {"file_name": "train/845.jpg", "text": "a car"}
846
+ {"file_name": "train/846.jpg", "text": "a car"}
847
+ {"file_name": "train/847.jpg", "text": "a car"}
848
+ {"file_name": "train/848.jpg", "text": "a car"}
849
+ {"file_name": "train/849.jpg", "text": "a car"}
850
+ {"file_name": "train/850.jpg", "text": "a car"}
851
+ {"file_name": "train/851.jpg", "text": "a car"}
852
+ {"file_name": "train/852.jpg", "text": "a car"}
853
+ {"file_name": "train/853.jpg", "text": "a car"}
854
+ {"file_name": "train/854.jpg", "text": "a car"}
855
+ {"file_name": "train/855.jpg", "text": "a car"}
856
+ {"file_name": "train/856.jpg", "text": "a car"}
857
+ {"file_name": "train/857.jpg", "text": "a car"}
858
+ {"file_name": "train/858.jpg", "text": "a car"}
859
+ {"file_name": "train/859.jpg", "text": "a car"}
860
+ {"file_name": "train/860.jpg", "text": "a car"}
861
+ {"file_name": "train/861.jpg", "text": "a car"}
862
+ {"file_name": "train/862.jpg", "text": "a car"}
863
+ {"file_name": "train/863.jpg", "text": "a car"}
864
+ {"file_name": "train/864.jpg", "text": "a car"}
865
+ {"file_name": "train/865.jpg", "text": "a car"}
866
+ {"file_name": "train/866.jpg", "text": "a car"}
867
+ {"file_name": "train/867.jpg", "text": "a car"}
868
+ {"file_name": "train/868.jpg", "text": "a car"}
869
+ {"file_name": "train/869.jpg", "text": "a car"}
870
+ {"file_name": "train/870.jpg", "text": "a car"}
871
+ {"file_name": "train/871.jpg", "text": "a car"}
872
+ {"file_name": "train/872.jpg", "text": "a car"}
873
+ {"file_name": "train/873.jpg", "text": "a car"}
874
+ {"file_name": "train/874.jpg", "text": "a car"}
875
+ {"file_name": "train/875.jpg", "text": "a car"}
876
+ {"file_name": "train/876.jpg", "text": "a car"}
877
+ {"file_name": "train/877.jpg", "text": "a car"}
878
+ {"file_name": "train/878.jpg", "text": "a car"}
879
+ {"file_name": "train/879.jpg", "text": "a car"}
880
+ {"file_name": "train/880.jpg", "text": "a car"}
881
+ {"file_name": "train/881.jpg", "text": "a car"}
882
+ {"file_name": "train/882.jpg", "text": "a car"}
883
+ {"file_name": "train/883.jpg", "text": "a car"}
884
+ {"file_name": "train/884.jpg", "text": "a car"}
885
+ {"file_name": "train/885.jpg", "text": "a car"}
886
+ {"file_name": "train/886.jpg", "text": "a car"}
887
+ {"file_name": "train/887.jpg", "text": "a car"}
888
+ {"file_name": "train/888.jpg", "text": "a car"}
889
+ {"file_name": "train/889.jpg", "text": "a car"}
890
+ {"file_name": "train/890.jpg", "text": "a car"}
891
+ {"file_name": "train/891.jpg", "text": "a car"}
892
+ {"file_name": "train/892.jpg", "text": "a car"}
893
+ {"file_name": "train/893.jpg", "text": "a car"}
894
+ {"file_name": "train/894.jpg", "text": "a car"}
895
+ {"file_name": "train/895.jpg", "text": "a car"}
896
+ {"file_name": "train/896.jpg", "text": "a car"}
897
+ {"file_name": "train/897.jpg", "text": "a car"}
898
+ {"file_name": "train/898.jpg", "text": "a car"}
899
+ {"file_name": "train/899.jpg", "text": "a car"}
900
+ {"file_name": "train/900.jpg", "text": "a car"}
901
+ {"file_name": "train/901.jpg", "text": "a car"}
902
+ {"file_name": "train/902.jpg", "text": "a car"}
903
+ {"file_name": "train/903.jpg", "text": "a car"}
904
+ {"file_name": "train/904.jpg", "text": "a car"}
905
+ {"file_name": "train/905.jpg", "text": "a car"}
906
+ {"file_name": "train/906.jpg", "text": "a car"}
907
+ {"file_name": "train/907.jpg", "text": "a car"}
908
+ {"file_name": "train/908.jpg", "text": "a car"}
909
+ {"file_name": "train/909.jpg", "text": "a car"}
910
+ {"file_name": "train/910.jpg", "text": "a car"}
911
+ {"file_name": "train/911.jpg", "text": "a car"}
912
+ {"file_name": "train/912.jpg", "text": "a car"}
913
+ {"file_name": "train/913.jpg", "text": "a car"}
914
+ {"file_name": "train/914.jpg", "text": "a car"}
915
+ {"file_name": "train/915.jpg", "text": "a car"}
916
+ {"file_name": "train/916.jpg", "text": "a car"}
917
+ {"file_name": "train/917.jpg", "text": "a car"}
918
+ {"file_name": "train/918.jpg", "text": "a car"}
919
+ {"file_name": "train/919.jpg", "text": "a car"}
920
+ {"file_name": "train/920.jpg", "text": "a car"}
921
+ {"file_name": "train/921.jpg", "text": "a car"}
922
+ {"file_name": "train/922.jpg", "text": "a car"}
923
+ {"file_name": "train/923.jpg", "text": "a car"}
924
+ {"file_name": "train/924.jpg", "text": "a car"}
925
+ {"file_name": "train/925.jpg", "text": "a car"}
926
+ {"file_name": "train/926.jpg", "text": "a car"}
927
+ {"file_name": "train/927.jpg", "text": "a car"}
928
+ {"file_name": "train/928.jpg", "text": "a car"}
929
+ {"file_name": "train/929.jpg", "text": "a car"}
930
+ {"file_name": "train/930.jpg", "text": "a car"}
931
+ {"file_name": "train/931.jpg", "text": "a car"}
932
+ {"file_name": "train/932.jpg", "text": "a car"}
933
+ {"file_name": "train/933.jpg", "text": "a car"}
934
+ {"file_name": "train/934.jpg", "text": "a car"}
935
+ {"file_name": "train/935.jpg", "text": "a car"}
936
+ {"file_name": "train/936.jpg", "text": "a car"}
937
+ {"file_name": "train/937.jpg", "text": "a car"}
938
+ {"file_name": "train/938.jpg", "text": "a car"}
939
+ {"file_name": "train/939.jpg", "text": "a car"}
940
+ {"file_name": "train/940.jpg", "text": "a car"}
941
+ {"file_name": "train/941.jpg", "text": "a car"}
942
+ {"file_name": "train/942.jpg", "text": "a car"}
943
+ {"file_name": "train/943.jpg", "text": "a car"}
944
+ {"file_name": "train/944.jpg", "text": "a car"}
945
+ {"file_name": "train/945.jpg", "text": "a car"}
946
+ {"file_name": "train/946.jpg", "text": "a car"}
947
+ {"file_name": "train/947.jpg", "text": "a car"}
948
+ {"file_name": "train/948.jpg", "text": "a car"}
949
+ {"file_name": "train/949.jpg", "text": "a car"}
950
+ {"file_name": "train/950.jpg", "text": "a car"}
951
+ {"file_name": "train/951.jpg", "text": "a car"}
952
+ {"file_name": "train/952.jpg", "text": "a car"}
953
+ {"file_name": "train/953.jpg", "text": "a car"}
954
+ {"file_name": "train/954.jpg", "text": "a car"}
955
+ {"file_name": "train/955.jpg", "text": "a car"}
956
+ {"file_name": "train/956.jpg", "text": "a car"}
957
+ {"file_name": "train/957.jpg", "text": "a car"}
958
+ {"file_name": "train/958.jpg", "text": "a car"}
959
+ {"file_name": "train/959.jpg", "text": "a car"}
960
+ {"file_name": "train/960.jpg", "text": "a car"}
961
+ {"file_name": "train/961.jpg", "text": "a car"}
962
+ {"file_name": "train/962.jpg", "text": "a car"}
963
+ {"file_name": "train/963.jpg", "text": "a car"}
964
+ {"file_name": "train/964.jpg", "text": "a car"}
965
+ {"file_name": "train/965.jpg", "text": "a car"}
966
+ {"file_name": "train/966.jpg", "text": "a car"}
967
+ {"file_name": "train/967.jpg", "text": "a car"}
968
+ {"file_name": "train/968.jpg", "text": "a car"}
969
+ {"file_name": "train/969.jpg", "text": "a car"}
970
+ {"file_name": "train/970.jpg", "text": "a car"}
971
+ {"file_name": "train/971.jpg", "text": "a car"}
972
+ {"file_name": "train/972.jpg", "text": "a car"}
973
+ {"file_name": "train/973.jpg", "text": "a car"}
974
+ {"file_name": "train/974.jpg", "text": "a car"}
975
+ {"file_name": "train/975.jpg", "text": "a car"}
976
+ {"file_name": "train/976.jpg", "text": "a car"}
977
+ {"file_name": "train/977.jpg", "text": "a car"}
978
+ {"file_name": "train/978.jpg", "text": "a car"}
979
+ {"file_name": "train/979.jpg", "text": "a car"}
980
+ {"file_name": "train/980.jpg", "text": "a car"}
981
+ {"file_name": "train/981.jpg", "text": "a car"}
982
+ {"file_name": "train/982.jpg", "text": "a car"}
983
+ {"file_name": "train/983.jpg", "text": "a car"}
984
+ {"file_name": "train/984.jpg", "text": "a car"}
985
+ {"file_name": "train/985.jpg", "text": "a car"}
986
+ {"file_name": "train/986.jpg", "text": "a car"}
987
+ {"file_name": "train/987.jpg", "text": "a car"}
988
+ {"file_name": "train/988.jpg", "text": "a car"}
989
+ {"file_name": "train/989.jpg", "text": "a car"}
990
+ {"file_name": "train/990.jpg", "text": "a car"}
991
+ {"file_name": "train/991.jpg", "text": "a car"}
992
+ {"file_name": "train/992.jpg", "text": "a car"}
993
+ {"file_name": "train/993.jpg", "text": "a car"}
994
+ {"file_name": "train/994.jpg", "text": "a car"}
995
+ {"file_name": "train/995.jpg", "text": "a car"}
996
+ {"file_name": "train/996.jpg", "text": "a car"}
997
+ {"file_name": "train/997.jpg", "text": "a car"}
998
+ {"file_name": "train/998.jpg", "text": "a car"}
999
+ {"file_name": "train/999.jpg", "text": "a car"}
1000
+ {"file_name": "train/1000.jpg", "text": "a car"}
models/ESD-X/esd-picasso_from_picasso-xattn_1-epochs_200.pt DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:f52f71a02de7c24b6191ec4385a6a5b08a7b2177458a7998dfffed28a6b49f50
- size 175883766
pytorch_env.yaml ADDED
@@ -0,0 +1,228 @@
+ name: pytorch_env
+ channels:
+   - conda-forge
+   - defaults
+ dependencies:
+   - _libgcc_mutex=0.1=conda_forge
+   - _openmp_mutex=4.5=2_gnu
+   - aiohappyeyeballs=2.4.0=py310h06a4308_0
+   - aiohttp=3.10.5=py310h5eee18b_0
+   - aiosignal=1.2.0=pyhd3eb1b0_0
+   - anyio=4.2.0=py310h06a4308_0
+   - argon2-cffi=21.3.0=pyhd3eb1b0_0
+   - argon2-cffi-bindings=21.2.0=py310h7f8727e_0
+   - arrow-cpp=16.1.0=hc1eb8f0_0
+   - asttokens=2.0.5=pyhd3eb1b0_0
+   - async-lru=2.0.4=py310h06a4308_0
+   - async-timeout=4.0.3=py310h06a4308_0
+   - attrs=23.1.0=py310h06a4308_0
+   - aws-c-auth=0.6.19=h5eee18b_0
+   - aws-c-cal=0.5.20=hdbd6064_0
+   - aws-c-common=0.8.5=h5eee18b_0
+   - aws-c-compression=0.2.16=h5eee18b_0
+   - aws-c-event-stream=0.2.15=h6a678d5_0
+   - aws-c-http=0.6.25=h5eee18b_0
+   - aws-c-io=0.13.10=h5eee18b_0
+   - aws-c-mqtt=0.7.13=h5eee18b_0
+   - aws-c-s3=0.1.51=hdbd6064_0
+   - aws-c-sdkutils=0.1.6=h5eee18b_0
+   - aws-checksums=0.1.13=h5eee18b_0
+   - aws-crt-cpp=0.18.16=h6a678d5_0
+   - aws-sdk-cpp=1.10.55=h721c034_0
+   - babel=2.11.0=py310h06a4308_0
+   - beautifulsoup4=4.12.2=py310h06a4308_0
+   - blas=1.0=mkl
+   - bleach=4.1.0=pyhd3eb1b0_0
+   - boost-cpp=1.82.0=hdb19cb5_2
+   - bottleneck=1.3.7=py310ha9d4c09_0
+   - brotli-python=1.0.9=py310h6a678d5_8
+   - bzip2=1.0.8=hd590300_5
+   - c-ares=1.19.1=h5eee18b_0
+   - ca-certificates=2024.9.24=h06a4308_0
+   - certifi=2024.8.30=py310h06a4308_0
+   - cffi=1.16.0=py310h5eee18b_1
+   - charset-normalizer=2.0.4=pyhd3eb1b0_0
+   - comm=0.2.1=py310h06a4308_0
+   - datasets=2.19.1=py310h06a4308_0
+   - debugpy=1.6.7=py310h6a678d5_0
+   - decorator=5.1.1=pyhd3eb1b0_0
+   - defusedxml=0.7.1=pyhd3eb1b0_0
+   - dill=0.3.8=py310h06a4308_0
+   - exceptiongroup=1.2.0=py310h06a4308_0
+   - executing=0.8.3=pyhd3eb1b0_0
+   - frozenlist=1.4.0=py310h5eee18b_0
+   - gflags=2.2.2=h6a678d5_1
+   - glog=0.5.0=h6a678d5_1
+   - huggingface_hub=0.24.6=py310h06a4308_0
+   - icu=73.1=h6a678d5_0
+   - idna=3.7=py310h06a4308_0
+   - intel-openmp=2023.1.0=hdb19cb5_46306
+   - ipykernel=6.28.0=py310h06a4308_0
+   - ipython=8.20.0=py310h06a4308_0
+   - jedi=0.18.1=py310h06a4308_1
+   - jinja2=3.1.3=py310h06a4308_0
+   - json5=0.9.6=pyhd3eb1b0_0
+   - jsonschema=4.19.2=py310h06a4308_0
+   - jsonschema-specifications=2023.7.1=py310h06a4308_0
+   - jupyter-lsp=2.2.0=py310h06a4308_0
+   - jupyter_client=8.6.0=py310h06a4308_0
+   - jupyter_core=5.5.0=py310h06a4308_0
+   - jupyter_events=0.8.0=py310h06a4308_0
+   - jupyter_server=2.10.0=py310h06a4308_0
+   - jupyter_server_terminals=0.4.4=py310h06a4308_1
+   - jupyterlab=4.0.11=py310h06a4308_0
+   - jupyterlab_pygments=0.1.2=py_0
+   - jupyterlab_server=2.25.1=py310h06a4308_0
+   - krb5=1.20.1=h143b758_1
+   - ld_impl_linux-64=2.40=h55db66e_0
+   - libabseil=20240116.2=cxx17_h6a678d5_0
+   - libboost=1.82.0=h109eef0_2
+   - libbrotlicommon=1.0.9=h5eee18b_8
+   - libbrotlidec=1.0.9=h5eee18b_8
+   - libbrotlienc=1.0.9=h5eee18b_8
+   - libcurl=8.9.1=h251f7ec_0
+   - libedit=3.1.20230828=h5eee18b_0
+   - libev=4.33=h7f8727e_1
+   - libevent=2.1.12=hdbd6064_1
+   - libffi=3.4.2=h7f98852_5
+   - libgcc-ng=13.2.0=h77fa898_7
+   - libgomp=13.2.0=h77fa898_7
+   - libgrpc=1.62.2=h2d74bed_0
+   - libnghttp2=1.57.0=h2d74bed_0
+   - libnsl=2.0.1=hd590300_0
+   - libprotobuf=4.25.3=he621ea3_0
+   - libsodium=1.0.18=h7b6447c_0
+   - libssh2=1.11.0=h251f7ec_0
+   - libstdcxx-ng=11.2.0=h1234567_1
+   - libthrift=0.15.0=h1795dd8_2
+   - libuuid=1.41.5=h5eee18b_0
+   - libxcrypt=4.4.36=hd590300_1
+   - lz4-c=1.9.4=h6a678d5_1
+   - markupsafe=2.1.3=py310h5eee18b_0
+   - matplotlib-inline=0.1.6=py310h06a4308_0
+   - mistune=2.0.4=py310h06a4308_0
+   - mkl=2023.1.0=h213fc3f_46344
+   - mkl-service=2.4.0=py310h5eee18b_1
+   - mkl_fft=1.3.10=py310h5eee18b_0
+   - mkl_random=1.2.7=py310h1128e8f_0
+   - multidict=6.0.4=py310h5eee18b_0
+   - multiprocess=0.70.15=py310h06a4308_0
+   - nbclient=0.8.0=py310h06a4308_0
+   - nbconvert=7.10.0=py310h06a4308_0
+   - nbformat=5.9.2=py310h06a4308_0
+   - ncurses=6.5=h59595ed_0
+   - nest-asyncio=1.6.0=py310h06a4308_0
+   - notebook-shim=0.2.3=py310h06a4308_0
+   - numexpr=2.8.7=py310h85018f9_0
+   - numpy=1.26.4=py310h5f9d8c6_0
+   - numpy-base=1.26.4=py310hb5e798b_0
+   - openssl=3.0.15=h5eee18b_0
+   - orc=2.0.1=h2d29ad5_0
+   - overrides=7.4.0=py310h06a4308_0
+   - packaging=23.2=py310h06a4308_0
+   - pandas=2.2.2=py310h6a678d5_0
+   - pandocfilters=1.5.0=pyhd3eb1b0_0
+   - parso=0.8.3=pyhd3eb1b0_0
+   - pexpect=4.8.0=pyhd3eb1b0_3
+   - pip=24.0=pyhd8ed1ab_0
+   - platformdirs=3.10.0=py310h06a4308_0
+   - prometheus_client=0.14.1=py310h06a4308_0
+   - prompt-toolkit=3.0.43=py310h06a4308_0
+   - prompt_toolkit=3.0.43=hd3eb1b0_0
+   - psutil=5.9.0=py310h5eee18b_0
+   - ptyprocess=0.7.0=pyhd3eb1b0_2
+   - pure_eval=0.2.2=pyhd3eb1b0_0
+   - pyarrow=16.1.0=py310h1128e8f_0
+   - pycparser=2.21=pyhd3eb1b0_0
+   - pygments=2.15.1=py310h06a4308_1
+   - pysocks=1.7.1=py310h06a4308_0
+   - python=3.10.15=he870216_1
+   - python-dateutil=2.9.0post0=py310h06a4308_0
+   - python-fastjsonschema=2.16.2=py310h06a4308_0
+   - python-json-logger=2.0.7=py310h06a4308_0
+   - python-tzdata=2023.3=pyhd3eb1b0_0
+   - python-xxhash=2.0.2=py310h5eee18b_1
+   - pytz=2024.1=py310h06a4308_0
+   - pyyaml=6.0.1=py310h5eee18b_0
+   - pyzmq=25.1.2=py310h6a678d5_0
+   - re2=2022.04.01=h295c915_0
+   - readline=8.2=h8228510_1
+   - referencing=0.30.2=py310h06a4308_0
+   - requests=2.31.0=py310h06a4308_1
+   - rfc3339-validator=0.1.4=py310h06a4308_0
+   - rfc3986-validator=0.1.1=py310h06a4308_0
+   - rpds-py=0.10.6=py310hb02cf49_0
+   - s2n=1.3.27=hdbd6064_0
+   - send2trash=1.8.2=py310h06a4308_0
+   - setuptools=69.5.1=pyhd8ed1ab_0
+   - six=1.16.0=pyhd3eb1b0_1
+   - snappy=1.2.1=h6a678d5_0
+   - sniffio=1.3.0=py310h06a4308_0
+   - soupsieve=2.5=py310h06a4308_0
+   - sqlite=3.45.3=h5eee18b_0
+   - stack_data=0.2.0=pyhd3eb1b0_0
+   - tbb=2021.8.0=hdb19cb5_0
+   - terminado=0.17.1=py310h06a4308_0
+   - tinycss2=1.2.1=py310h06a4308_0
+   - tk=8.6.14=h39e8969_0
+   - tomli=2.0.1=py310h06a4308_0
+   - tornado=6.3.3=py310h5eee18b_0
+   - traitlets=5.7.1=py310h06a4308_0
+   - typing-extensions=4.11.0=py310h06a4308_0
+   - typing_extensions=4.11.0=py310h06a4308_0
+   - urllib3=2.2.1=py310h06a4308_0
+   - utf8proc=2.6.1=h5eee18b_1
+   - wcwidth=0.2.5=pyhd3eb1b0_0
+   - webencodings=0.5.1=py310h06a4308_1
+   - websocket-client=1.8.0=py310h06a4308_0
+   - wheel=0.43.0=pyhd8ed1ab_1
+   - xxhash=0.8.0=h7f8727e_3
+   - xz=5.4.6=h5eee18b_1
+   - yaml=0.2.5=h7b6447c_0
+   - yarl=1.11.0=py310h5eee18b_0
+   - zeromq=4.3.5=h6a678d5_0
+   - zlib=1.2.13=h5eee18b_1
+   - zstd=1.5.6=hc292b87_0
+   - pip:
+     - accelerate==0.30.1
+     - contourpy==1.2.1
+     - cycler==0.12.1
+     - diffusers==0.31.0
+     - filelock==3.14.0
+     - fonttools==4.51.0
+     - fsspec==2024.5.0
+     - git-lfs==1.6
+     - huggingface-hub==0.26.2
+     - importlib-metadata==7.1.0
+     - kiwisolver==1.4.5
+     - matplotlib==3.9.0
+     - mpmath==1.3.0
+     - networkx==3.3
+     - nvidia-cublas-cu12==12.1.3.1
+     - nvidia-cuda-cupti-cu12==12.1.105
+     - nvidia-cuda-nvrtc-cu12==12.1.105
+     - nvidia-cuda-runtime-cu12==12.1.105
+     - nvidia-cudnn-cu12==8.9.2.26
+     - nvidia-cufft-cu12==11.0.2.54
+     - nvidia-curand-cu12==10.3.2.106
+     - nvidia-cusolver-cu12==11.4.5.107
+     - nvidia-cusparse-cu12==12.1.0.106
+     - nvidia-nccl-cu12==2.20.5
+     - nvidia-nvjitlink-cu12==12.4.127
+     - nvidia-nvtx-cu12==12.1.105
+     - pillow==10.3.0
+     - pyparsing==3.1.2
+     - regex==2024.5.15
+     - safetensors==0.4.3
+     - scipy==1.13.0
+     - sympy==1.12
+     - tokenizers==0.19.1
+     - torch==2.3.0
+     - torchaudio==2.3.0
+     - torchvision==0.18.0
+     - tqdm==4.66.4
+     - transformers==4.41.0
+     - triton==2.3.0
+     - tzdata==2024.1
+     - zipp==3.18.2
+ prefix: /home/lu.kev/.conda/envs/pytorch_env
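For reproducibility, the environment can be recreated with conda env create -f pytorch_env.yaml and then sanity-checked against the pins above. A minimal sketch (local build suffixes such as +cu121 may appear in the reported version strings):

import torch
import diffusers
import transformers

# These should match the pins in pytorch_env.yaml.
print("torch:", torch.__version__)                # pinned: 2.3.0
print("diffusers:", diffusers.__version__)        # pinned: 0.31.0
print("transformers:", transformers.__version__)  # pinned: 4.41.0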
test_gpu.py ADDED
@@ -0,0 +1,11 @@
+ import torch
+
+ # Check if PyTorch is installed and environment is working
+ print("Conda environment is working!")
+
+ # Check for GPU availability
+ if torch.cuda.is_available():
+     print("GPU is available!")
+     print(f"GPU Name: {torch.cuda.get_device_name(0)}")
+ else:
+     print("GPU is not available.")