Add files using upload-large-folder tool
Browse files- .gitattributes +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model.safetensors +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/model.safetensors +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/model.safetensors +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model.safetensors +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/model.safetensors +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00003-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00003-of-00004.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00003-of-00004.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors +3 -0
.gitattributes
CHANGED
@@ -136,3 +136,6 @@ checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoin
|
|
136 |
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
137 |
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
138 |
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
136 |
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
137 |
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
138 |
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
139 |
+
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
140 |
+
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
141 |
+
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoints/Qwen2.5-0.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76729eb1c7597bb816038a45d1bd201ade3f9cab68a4295be8823bc1c1d2913f
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0243a464739cccb01997fc142059b505b6e8b9a934409970fbd047b35fdc4599
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5190e422e2549c7b5f6e900ea33a2536289cf52401e76ff562e5c79b29d0cdd7
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-0.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b1d27e812bedabc1e979a96ed2867c0966f2a2d178bcb5af9eb0bfa70d3fb2d
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-0.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c53ef270b5b61748d88b3ffa8a3af14c761269a690dc66048acd939d469ab581
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a4586e2577df5c7df99f7f22a9eb9c344aa93bfea80555b0225f947467a9d86
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:266fcc533ea792552b7c19c9157314f16447b5399b6521b6b4a34d6f66ead908
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecd83fc7e66c5df56d1de2cf94904a61d23ed07d056f5f3fb227cdd17f187772
|
3 |
+
size 11422536
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6077415ede742c09f6b95b3d1141bc308027e4015e3994963228a75ee63a2db
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea894031550f052a88a6f7448c02831ed9cf20b1e417176d4208573554c6e73
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2233ac8a28cc4455a976ca2193883f1026fea3da73c41327fe19629a6ff32313
|
3 |
+
size 11422076
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b26f8adc089ba800b6869188c43c8ba46d9eff17df63812bd52b803b04d19fdb
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b76454021945f9531fb2ccbe7a32b66dd1f31ed30f310ad78bded418cb71d2
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2233ac8a28cc4455a976ca2193883f1026fea3da73c41327fe19629a6ff32313
|
3 |
+
size 11422076
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b26f8adc089ba800b6869188c43c8ba46d9eff17df63812bd52b803b04d19fdb
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00003-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f23372f78080fcde7cfac4448e6244ffb882acfc97c6d387fede431b45d8c3e0
|
3 |
+
size 4954847280
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6472f2e61cf236cbaf984c344d412889fd4b0c6f120bee7d84618b2d86c9ba5
|
3 |
+
size 4954847280
|
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f64dd3e58dbbd14971b1950101c14b1885671394546ef8e7b2b7373230e5ab0b
|
3 |
+
size 4330865088
|
checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0355367db772443a3bceb7e63d4b7925db88da86fc7ca67b8f8241c6aead97c3
|
3 |
+
size 4330865088
|
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dc0c52ab6e6e23f20b9d7393e625395a977c26106d8567b61f20069e8f39e2b
|
3 |
+
size 4330865088
|