Add files using upload-large-folder tool
Browse files- .gitattributes +3 -0
- checkpoints/Qwen2.5-0.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/model.safetensors +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
- checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00001-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00002-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00005-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00006-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors +3 -0
- checkpoints/Qwen2.5-7B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors +3 -0
.gitattributes
CHANGED
@@ -133,3 +133,6 @@ checkpoints/Qwen2.5-0.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/to
|
|
133 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-0.5B/blobs/88c142557820ccad55bb59756bfcfcf891de9cc6202816bd346445188a0ed342 filter=lfs diff=lfs merge=lfs -text
|
134 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
135 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
133 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-0.5B/blobs/88c142557820ccad55bb59756bfcfcf891de9cc6202816bd346445188a0ed342 filter=lfs diff=lfs merge=lfs -text
|
134 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
135 |
checkpoints/Qwen2.5-0.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
136 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
137 |
+
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
138 |
+
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoints/Qwen2.5-0.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ddc3c16ca115844d6eda713a70e40e8a0ad011234709683bd502bff33b7aaa2
|
3 |
+
size 1260367152
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1624ef9770b8f455f1fa79fd5fa6ffca4c49ba7f89fc032dc21b0a014579023b
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72bd953fd767cfc5bbb80660ae99e4d0fb61156c00f0b685b4427e6957756bc9
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecd83fc7e66c5df56d1de2cf94904a61d23ed07d056f5f3fb227cdd17f187772
|
3 |
+
size 11422536
|
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6077415ede742c09f6b95b3d1141bc308027e4015e3994963228a75ee63a2db
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
|
3 |
+
size 11421896
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f76918371b6c8d743e69eccad6f60c7cf3b16ff7e72dda7abd716e4b4472e8c
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
|
3 |
+
size 14448
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-50/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f76918371b6c8d743e69eccad6f60c7cf3b16ff7e72dda7abd716e4b4472e8c
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e6ec0c8311bc44bf18da345ce9eede9aa5e521ea1bb189b19ab0c8766101dcd
|
3 |
+
size 4986211200
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c36d4ee30b71003c0056069b8514ea0f123c553468f287f5c829f8135ff5d6f
|
3 |
+
size 4954847240
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c86f37de3b554fe472495c8be24c5a54d67ae03f9c53602b6bc3b22157de68c
|
3 |
+
size 4954847280
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1591cf4b9b2b0fae1a89bd7f26fcbe2958e512881ec2d782340acb470bd5c42c
|
3 |
+
size 4734533096
|
checkpoints/Qwen2.5-7B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3754046240b4371da14adbd643da586f89025e248a1e56e3ea73abb5ff28c9ff
|
3 |
+
size 4330865088
|
checkpoints/Qwen2.5-7B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9b43b7914e4a851c9cad1ed26df2ddefa2a1371405fc64c3e02dc1752872000
|
3 |
+
size 4932750888
|