bghira committed on
Commit
08da3ef
·
verified ·
1 Parent(s): 7193873

Trained for 0 epochs and 250 steps.

Browse files

Trained with datasets ['text-embeds', 'sfwbooru-crop']
Learning rate 1.0, batch size 4, and 1 gradient accumulation step.
Used DDPM noise scheduler for training with epsilon prediction type and rescaled_betas_zero_snr=False
Using 'trailing' timestep spacing.
Base model: stabilityai/stable-diffusion-3.5-medium
VAE: None

README.md CHANGED
@@ -12,287 +12,7 @@ tags:
12
 
13
 
14
  inference: true
15
- widget:
16
- - text: 'unconditional (blank prompt)'
17
- parameters:
18
- negative_prompt: 'blurry, cropped, ugly'
19
- output:
20
- url: ./assets/image_0_0.png
21
- - text: 'Alien planet, strange rock formations, glowing plants, bizarre creatures, surreal atmosphere'
22
- parameters:
23
- negative_prompt: 'blurry, cropped, ugly'
24
- output:
25
- url: ./assets/image_1_0.png
26
- - text: 'Alien marketplace, bizarre creatures, exotic goods, vibrant colors, otherworldly atmosphere'
27
- parameters:
28
- negative_prompt: 'blurry, cropped, ugly'
29
- output:
30
- url: ./assets/image_2_0.png
31
- - text: 'Child holding a balloon, happy expression, colorful balloons, sunny day, high detail'
32
- parameters:
33
- negative_prompt: 'blurry, cropped, ugly'
34
- output:
35
- url: ./assets/image_3_0.png
36
- - text: 'a 4-panel comic strip showing an orange cat saying the words ''HELP'' and ''LASAGNA'''
37
- parameters:
38
- negative_prompt: 'blurry, cropped, ugly'
39
- output:
40
- url: ./assets/image_4_0.png
41
- - text: 'a hand is holding a comic book with a cover that reads ''The Adventures of Superhero'''
42
- parameters:
43
- negative_prompt: 'blurry, cropped, ugly'
44
- output:
45
- url: ./assets/image_5_0.png
46
- - text: 'Underground cave filled with crystals, glowing lights, reflective surfaces, fantasy environment, high detail'
47
- parameters:
48
- negative_prompt: 'blurry, cropped, ugly'
49
- output:
50
- url: ./assets/image_6_0.png
51
- - text: 'Bustling cyberpunk bazaar, vendors, neon signs, advanced tech, crowded, high detail'
52
- parameters:
53
- negative_prompt: 'blurry, cropped, ugly'
54
- output:
55
- url: ./assets/image_7_0.png
56
- - text: 'Cyberpunk hacker in a dark room, neon glow, multiple screens, intense focus, high detail'
57
- parameters:
58
- negative_prompt: 'blurry, cropped, ugly'
59
- output:
60
- url: ./assets/image_8_0.png
61
- - text: 'a cybernetic anne of green gables with neural implant and bio mech augmentations'
62
- parameters:
63
- negative_prompt: 'blurry, cropped, ugly'
64
- output:
65
- url: ./assets/image_9_0.png
66
- - text: 'Post-apocalyptic cityscape, ruined buildings, overgrown vegetation, dark and gritty, high detail'
67
- parameters:
68
- negative_prompt: 'blurry, cropped, ugly'
69
- output:
70
- url: ./assets/image_10_0.png
71
- - text: 'Magical castle in a lush forest, glowing windows, fantasy architecture, high resolution, detailed textures'
72
- parameters:
73
- negative_prompt: 'blurry, cropped, ugly'
74
- output:
75
- url: ./assets/image_11_0.png
76
- - text: 'Ruins of an ancient temple in an enchanted forest, glowing runes, mystical creatures, high detail'
77
- parameters:
78
- negative_prompt: 'blurry, cropped, ugly'
79
- output:
80
- url: ./assets/image_12_0.png
81
- - text: 'Mystical forest, glowing plants, fairies, magical creatures, fantasy art, high detail'
82
- parameters:
83
- negative_prompt: 'blurry, cropped, ugly'
84
- output:
85
- url: ./assets/image_13_0.png
86
- - text: 'Magical garden with glowing flowers, fairies, serene atmosphere, detailed plants, high resolution'
87
- parameters:
88
- negative_prompt: 'blurry, cropped, ugly'
89
- output:
90
- url: ./assets/image_14_0.png
91
- - text: 'Whimsical garden filled with fairies, magical plants, sparkling lights, serene atmosphere, high detail'
92
- parameters:
93
- negative_prompt: 'blurry, cropped, ugly'
94
- output:
95
- url: ./assets/image_15_0.png
96
- - text: 'Majestic dragon soaring through the sky, detailed scales, dynamic pose, fantasy art, high resolution'
97
- parameters:
98
- negative_prompt: 'blurry, cropped, ugly'
99
- output:
100
- url: ./assets/image_16_0.png
101
- - text: 'Fantasy world, floating islands in the sky, waterfalls, lush vegetation, detailed landscape, high resolution'
102
- parameters:
103
- negative_prompt: 'blurry, cropped, ugly'
104
- output:
105
- url: ./assets/image_17_0.png
106
- - text: 'Futuristic city skyline at night, neon lights, cyberpunk style, high contrast, sharp focus'
107
- parameters:
108
- negative_prompt: 'blurry, cropped, ugly'
109
- output:
110
- url: ./assets/image_18_0.png
111
- - text: 'Space battle scene, starships fighting, laser beams, explosions, cosmic background'
112
- parameters:
113
- negative_prompt: 'blurry, cropped, ugly'
114
- output:
115
- url: ./assets/image_19_0.png
116
- - text: 'Abandoned fairground at night, eerie rides, ghostly figures, fog, dark atmosphere, high detail'
117
- parameters:
118
- negative_prompt: 'blurry, cropped, ugly'
119
- output:
120
- url: ./assets/image_20_0.png
121
- - text: 'Spooky haunted mansion on a hill, dark and eerie, glowing windows, ghostly atmosphere, high detail'
122
- parameters:
123
- negative_prompt: 'blurry, cropped, ugly'
124
- output:
125
- url: ./assets/image_21_0.png
126
- - text: 'a hardcover physics textbook that is called PHYSICS FOR DUMMIES'
127
- parameters:
128
- negative_prompt: 'blurry, cropped, ugly'
129
- output:
130
- url: ./assets/image_22_0.png
131
- - text: 'Epic medieval battle, knights in armor, dynamic action, detailed landscape, high resolution'
132
- parameters:
133
- negative_prompt: 'blurry, cropped, ugly'
134
- output:
135
- url: ./assets/image_23_0.png
136
- - text: 'Bustling medieval market with merchants, knights, and jesters, vibrant colors, detailed'
137
- parameters:
138
- negative_prompt: 'blurry, cropped, ugly'
139
- output:
140
- url: ./assets/image_24_0.png
141
- - text: 'Cozy medieval tavern, warm firelight, adventurers drinking, detailed interior, rustic atmosphere'
142
- parameters:
143
- negative_prompt: 'blurry, cropped, ugly'
144
- output:
145
- url: ./assets/image_25_0.png
146
- - text: 'Futuristic city skyline at night, neon lights, cyberpunk style, high contrast, sharp focus'
147
- parameters:
148
- negative_prompt: 'blurry, cropped, ugly'
149
- output:
150
- url: ./assets/image_26_0.png
151
- - text: 'Forest with neon-lit trees, glowing plants, bioluminescence, surreal atmosphere, high detail'
152
- parameters:
153
- negative_prompt: 'blurry, cropped, ugly'
154
- output:
155
- url: ./assets/image_27_0.png
156
- - text: 'Bright neon sign in a busy city street, ''Open 24 Hours'', bold typography, glowing lights'
157
- parameters:
158
- negative_prompt: 'blurry, cropped, ugly'
159
- output:
160
- url: ./assets/image_28_0.png
161
- - text: 'Vibrant neon sign, ''Bar'', bold typography, dark background, glowing lights, detailed design'
162
- parameters:
163
- negative_prompt: 'blurry, cropped, ugly'
164
- output:
165
- url: ./assets/image_29_0.png
166
- - text: 'Pirate ship on the high seas, stormy weather, detailed sails, dramatic waves, photorealistic'
167
- parameters:
168
- negative_prompt: 'blurry, cropped, ugly'
169
- output:
170
- url: ./assets/image_30_0.png
171
- - text: 'Pirate discovering a treasure chest, detailed gold coins, tropical island, dramatic lighting'
172
- parameters:
173
- negative_prompt: 'blurry, cropped, ugly'
174
- output:
175
- url: ./assets/image_31_0.png
176
- - text: 'a photograph of a woman experiencing a psychedelic trip. trippy, 8k, uhd, fractal'
177
- parameters:
178
- negative_prompt: 'blurry, cropped, ugly'
179
- output:
180
- url: ./assets/image_32_0.png
181
- - text: 'Cozy cafe on a rainy day, people sipping coffee, warm lights, reflections on wet pavement, photorealistic'
182
- parameters:
183
- negative_prompt: 'blurry, cropped, ugly'
184
- output:
185
- url: ./assets/image_33_0.png
186
- - text: '1980s arcade, neon lights, vintage game machines, kids playing, vibrant colors, nostalgic atmosphere'
187
- parameters:
188
- negative_prompt: 'blurry, cropped, ugly'
189
- output:
190
- url: ./assets/image_34_0.png
191
- - text: '1980s game room with vintage arcade machines, neon lights, vibrant colors, nostalgic feel'
192
- parameters:
193
- negative_prompt: 'blurry, cropped, ugly'
194
- output:
195
- url: ./assets/image_35_0.png
196
- - text: 'Robot blacksmith forging metal, sparks flying, detailed workshop, futuristic and medieval blend'
197
- parameters:
198
- negative_prompt: 'blurry, cropped, ugly'
199
- output:
200
- url: ./assets/image_36_0.png
201
- - text: 'Sleek robot performing a dance, futuristic theater, holographic effects, detailed, high resolution'
202
- parameters:
203
- negative_prompt: 'blurry, cropped, ugly'
204
- output:
205
- url: ./assets/image_37_0.png
206
- - text: 'High-tech factory where robots are assembled, detailed machinery, futuristic setting, high detail'
207
- parameters:
208
- negative_prompt: 'blurry, cropped, ugly'
209
- output:
210
- url: ./assets/image_38_0.png
211
- - text: 'Garden tended by robots, mechanical plants, colorful flowers, futuristic setting, high detail'
212
- parameters:
213
- negative_prompt: 'blurry, cropped, ugly'
214
- output:
215
- url: ./assets/image_39_0.png
216
- - text: 'Cute robotic pet, futuristic home, sleek design, detailed features, friendly and animated'
217
- parameters:
218
- negative_prompt: 'blurry, cropped, ugly'
219
- output:
220
- url: ./assets/image_40_0.png
221
- - text: 'cctv trail camera night time security picture of a wendigo in the woods'
222
- parameters:
223
- negative_prompt: 'blurry, cropped, ugly'
224
- output:
225
- url: ./assets/image_41_0.png
226
- - text: 'Astronaut exploring an alien planet, detailed landscape, futuristic suit, cosmic background'
227
- parameters:
228
- negative_prompt: 'blurry, cropped, ugly'
229
- output:
230
- url: ./assets/image_42_0.png
231
- - text: 'Futuristic space station orbiting a distant exoplanet, sleek design, detailed structures, cosmic backdrop'
232
- parameters:
233
- negative_prompt: 'blurry, cropped, ugly'
234
- output:
235
- url: ./assets/image_43_0.png
236
- - text: 'a person holding a sign that reads ''SOON'''
237
- parameters:
238
- negative_prompt: 'blurry, cropped, ugly'
239
- output:
240
- url: ./assets/image_44_0.png
241
- - text: 'Steampunk airship in the sky, intricate design, Victorian aesthetics, dynamic scene, high detail'
242
- parameters:
243
- negative_prompt: 'blurry, cropped, ugly'
244
- output:
245
- url: ./assets/image_45_0.png
246
- - text: 'Steampunk inventor in a workshop, intricate gadgets, Victorian attire, mechanical arm, goggles'
247
- parameters:
248
- negative_prompt: 'blurry, cropped, ugly'
249
- output:
250
- url: ./assets/image_46_0.png
251
- - text: 'Stormy ocean with towering waves, dramatic skies, detailed water, intense atmosphere, high resolution'
252
- parameters:
253
- negative_prompt: 'blurry, cropped, ugly'
254
- output:
255
- url: ./assets/image_47_0.png
256
- - text: 'Dramatic stormy sea, lighthouse in the distance, lightning striking, dark clouds, high detail'
257
- parameters:
258
- negative_prompt: 'blurry, cropped, ugly'
259
- output:
260
- url: ./assets/image_48_0.png
261
- - text: 'Graffiti artist creating a mural, vibrant colors, urban setting, dynamic action, high resolution'
262
- parameters:
263
- negative_prompt: 'blurry, cropped, ugly'
264
- output:
265
- url: ./assets/image_49_0.png
266
- - text: 'Urban alleyway filled with vibrant graffiti art, tags and murals, realistic textures'
267
- parameters:
268
- negative_prompt: 'blurry, cropped, ugly'
269
- output:
270
- url: ./assets/image_50_0.png
271
- - text: 'Urban street sign, ''Main Street'', bold typography, realistic textures, weathered look'
272
- parameters:
273
- negative_prompt: 'blurry, cropped, ugly'
274
- output:
275
- url: ./assets/image_51_0.png
276
- - text: 'Classic car show with vintage vehicles, vibrant colors, nostalgic atmosphere, high detail'
277
- parameters:
278
- negative_prompt: 'blurry, cropped, ugly'
279
- output:
280
- url: ./assets/image_52_0.png
281
- - text: 'Retro diner sign, ''Joe''s Diner'', classic 1950s design, neon lights, weathered look'
282
- parameters:
283
- negative_prompt: 'blurry, cropped, ugly'
284
- output:
285
- url: ./assets/image_53_0.png
286
- - text: 'Vintage store sign with elaborate typography, ''Antique Shop'', hand-painted, weathered look'
287
- parameters:
288
- negative_prompt: 'blurry, cropped, ugly'
289
- output:
290
- url: ./assets/image_54_0.png
291
- - text: 'A photo-realistic image of a cat'
292
- parameters:
293
- negative_prompt: 'blurry, cropped, ugly'
294
- output:
295
- url: ./assets/image_55_0.png
296
  ---
297
 
298
  # sd35m-sfwbooru
@@ -317,7 +37,7 @@ A photo-realistic image of a cat
317
 
318
  Note: The validation settings are not necessarily the same as the [training settings](#training-settings).
319
 
320
- You can find some example images in the following gallery:
321
 
322
 
323
  <Gallery />
@@ -329,7 +49,7 @@ You may reuse the base model text encoder for inference.
329
  ## Training settings
330
 
331
  - Training epochs: 0
332
- - Training steps: 1750
333
  - Learning rate: 1.0
334
  - Learning rate schedule: cosine
335
  - Warmup steps: 500000
 
12
 
13
 
14
  inference: true
15
+
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  ---
17
 
18
  # sd35m-sfwbooru
 
37
 
38
  Note: The validation settings are not necessarily the same as the [training settings](#training-settings).
39
 
40
+
41
 
42
 
43
  <Gallery />
 
49
  ## Training settings
50
 
51
  - Training epochs: 0
52
+ - Training steps: 250
53
  - Learning rate: 1.0
54
  - Learning rate schedule: cosine
55
  - Warmup steps: 500000
optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f2b56d5958266737e04d7c24462b8785f0495d58554999682477e1ee8ec9a47
3
- size 5313950865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:867a4873c3ae7a55c17e2475d96f08628b7e968e56f0a6bd01bd982049e128fc
3
+ size 5313950929
random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4971ffa3ec5806e655820078f11abe5540c1c70414825d7c13ae9a024edbe61
3
  size 14408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99bf871de134557de54bf77d25fb31f777f2224fcd6e6041e47ce5a6d2672026
3
  size 14408
scheduler.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04cd64d17d9f39c8a525a7e06ce158b5f50c6b4f49254fc1e6dc9348d660675e
3
- size 1000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7252e5c3f58be52fe8c2c37582fc18c90e2e3f299e3e1dc7fcda246d4ddfd9ba
3
+ size 1128
training_state-sfwbooru-crop.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bf596ef079d003b4401239a2e442c81b93c7c93aae09c6ceef81625709eb2f3
3
- size 14878962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b584aa4e8c0691b04b41ef75dd99145adfee762272ae6c2fa4d8342506c4f51a
3
+ size 14602962
training_state.json CHANGED
@@ -1 +1 @@
1
- {"global_step": 1750, "epoch_step": 1750, "epoch": 1, "exhausted_backends": [], "repeats": {}}
 
1
+ {"global_step": 250, "epoch_step": 250, "epoch": 1, "exhausted_backends": [], "repeats": {}}
transformer/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95d0405de3c62116ac59d28e104e7069bb8a6c49324e9ae8f9361ab11ab6ddf1
3
  size 4939433672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd0b062ab396e14ef93fe1a72d59e70aff5b1a8b6783f523c90b57f4bb060e7
3
  size 4939433672
transformer_ema/config.json CHANGED
@@ -26,7 +26,7 @@
26
  "min_decay": 0.0,
27
  "num_attention_heads": 24,
28
  "num_layers": 24,
29
- "optimization_step": 1750,
30
  "out_channels": 16,
31
  "patch_size": 2,
32
  "pooled_projection_dim": 2048,
 
26
  "min_decay": 0.0,
27
  "num_attention_heads": 24,
28
  "num_layers": 24,
29
+ "optimization_step": 250,
30
  "out_channels": 16,
31
  "patch_size": 2,
32
  "pooled_projection_dim": 2048,
transformer_ema/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c9720b40b55a18ba6ee8c1076b965a37b9084e9050e98423dca11a02fd4f5ff
3
  size 9878760864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5666aee4d3ab5b474c86a7d97a30fcb9d5245ed9b18139acf66bfb9f8dd9bb
3
  size 9878760864
transformer_ema/ema_model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83a6537d90639a875ab22f5b39350447241a043588c3d7bc9f59e2efcdafc95b
3
  size 4486612394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae6831ac6a6884470566705f4870ee81b03d8f3e5c0c4674b7f979cfa4e8a430
3
  size 4486612394