Trained for 1 epoch and 64000 steps.
Browse files
Trained with datasets ['text-embeds', 'sfwbooru-crop']
Learning rate 1.0, batch size 6, and 1 gradient accumulation steps.
Used DDPM noise scheduler for training with epsilon prediction type and rescaled_betas_zero_snr=False
Using 'trailing' timestep spacing.
Base model: stabilityai/stable-diffusion-3.5-medium
VAE: None
- README.md +1 -1
- optimizer.bin +1 -1
- random_states_0.pkl +2 -2
- scheduler.bin +1 -1
- training_state-sfwbooru-crop.json +2 -2
- training_state.json +1 -1
- transformer/diffusion_pytorch_model.safetensors +1 -1
- transformer_ema/config.json +1 -1
- transformer_ema/diffusion_pytorch_model.safetensors +1 -1
- transformer_ema/ema_model.pt +1 -1
README.md
CHANGED
@@ -329,7 +329,7 @@ You may reuse the base model text encoder for inference.
|
|
329 |
## Training settings
|
330 |
|
331 |
- Training epochs: 1
|
332 |
-
- Training steps:
|
333 |
- Learning rate: 1.0
|
334 |
- Learning rate schedule: cosine
|
335 |
- Warmup steps: 500000
|
|
|
329 |
## Training settings
|
330 |
|
331 |
- Training epochs: 1
|
332 |
+
- Training steps: 64000
|
333 |
- Learning rate: 1.0
|
334 |
- Learning rate schedule: cosine
|
335 |
- Warmup steps: 500000
|
optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4493633377
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddb4738a7a1dc93a4c7f2dd30f5be36846175ff0c8a857f11501921af30fe470
|
3 |
size 4493633377
|
random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eca79f87743cada6146b3309c797b7eedb395f7e37a8a2a1b65fe120cbd5f7b
|
3 |
+
size 14344
|
scheduler.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1128
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7093755a4f3ebce2e83de789544f992488222401accbe122a828334206552e7
|
3 |
size 1128
|
training_state-sfwbooru-crop.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57c0c31e88ebd5551d8f2a9f84963bef0aa9a3ab4c37a37480a0896141c3d570
|
3 |
+
size 15158642
|
training_state.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"global_step":
|
|
|
1 |
+
{"global_step": 64000, "epoch_step": 64000, "epoch": 2, "exhausted_backends": [], "repeats": {"sfwbooru-crop": 0}}
|
transformer/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4939433672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7695eb5b5da1193d4460e89ae5e4aadc9cca33e6df9fcefec51ae79b0abc1f6
|
3 |
size 4939433672
|
transformer_ema/config.json
CHANGED
@@ -26,7 +26,7 @@
|
|
26 |
"min_decay": 0.0,
|
27 |
"num_attention_heads": 24,
|
28 |
"num_layers": 24,
|
29 |
-
"optimization_step":
|
30 |
"out_channels": 16,
|
31 |
"patch_size": 2,
|
32 |
"pooled_projection_dim": 2048,
|
|
|
26 |
"min_decay": 0.0,
|
27 |
"num_attention_heads": 24,
|
28 |
"num_layers": 24,
|
29 |
+
"optimization_step": 64000,
|
30 |
"out_channels": 16,
|
31 |
"patch_size": 2,
|
32 |
"pooled_projection_dim": 2048,
|
transformer_ema/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 9878760864
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ded7a841837604165d6e909a6f4f1b3f6348aef370b4fb5d8a6d0c7bdc65953
|
3 |
size 9878760864
|
transformer_ema/ema_model.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4486612394
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64a6ef41f961d9c3d754b0a773560dc2a1ca6c200f7fef295d93971a3eda15e3
|
3 |
size 4486612394
|