Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +10 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors +3 -0
.gitattributes
CHANGED
@@ -139,3 +139,13 @@ checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/token
|
|
139 |
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
140 |
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
141 |
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
139 |
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
140 |
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
141 |
checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
142 |
+
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
143 |
+
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
144 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
145 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
146 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
|
147 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
148 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
149 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
|
150 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
151 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
|
3 |
+
size 3087467144
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea894031550f052a88a6f7448c02831ed9cf20b1e417176d4208573554c6e73
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
|
3 |
+
size 11422356
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b76454021945f9531fb2ccbe7a32b66dd1f31ed30f310ad78bded418cb71d2
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
|
3 |
+
size 11422356
|
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
|
3 |
+
size 11421896
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
|
3 |
+
size 11421896
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
|
3 |
+
size 3087467144
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
|
3 |
+
size 3087467144
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
|
3 |
+
size 3087467144
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
|
3 |
+
size 3087467144
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b757d9e994524104820728f1347cc4a41247be150dc32b73b9b3f45deebe352f
|
3 |
+
size 4986211200
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75e0cfc2c662c54bf5e4a4c7e6037540386087c0cdf8e87feadab6b70b77539d
|
3 |
+
size 4954847240
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f651272df1b4a6e53555f54a447c664890d5ea60662fe11e3800bb117b15b595
|
3 |
+
size 4954847280
|
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:774afbf6338e2bf1ea5bd1b4d1bfff1384168de879aa4ac66a01b70ad7ff94a7
|
3 |
+
size 4877660672
|