Yaning1001 commited on
Commit
ca646ac
·
verified ·
1 Parent(s): 4f97cff

Add files using upload-large-folder tool

Browse files
Files changed (36) hide show
  1. .gitattributes +7 -0
  2. checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
  3. checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
  4. checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
  5. checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth +3 -0
  6. checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth +3 -0
  7. checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt +3 -0
  8. checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json +3 -0
  9. checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin +3 -0
  10. checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/rng_state_0.pth +3 -0
  11. checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/rng_state_1.pth +3 -0
  12. checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/scheduler.pt +3 -0
  13. checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/tokenizer.json +3 -0
  14. checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/training_args.bin +3 -0
  15. checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
  16. checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
  17. checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
  18. checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
  19. checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
  20. checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
  21. checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
  22. checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
  23. checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
  24. checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
  25. checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
  26. checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
  27. checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
  28. checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
  29. checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
  30. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00002-of-00004.safetensors +3 -0
  31. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00001-of-00004.safetensors +3 -0
  32. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00002-of-00004.safetensors +3 -0
  33. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00001-of-00004.safetensors +3 -0
  34. checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors +3 -0
  35. checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors +3 -0
  36. checkpoints/Qwen2.5-7B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors +3 -0
.gitattributes CHANGED
@@ -149,3 +149,10 @@ checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/to
149
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
150
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
151
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
149
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
150
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
151
  checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
152
+ checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
153
+ checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
154
+ checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
155
+ checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
156
+ checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
157
+ checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
158
+ checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_shuffle_nondeterministic_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4586e2577df5c7df99f7f22a9eb9c344aa93bfea80555b0225f947467a9d86
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1624ef9770b8f455f1fa79fd5fa6ffca4c49ba7f89fc032dc21b0a014579023b
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72bd953fd767cfc5bbb80660ae99e4d0fb61156c00f0b685b4427e6957756bc9
3
+ size 1064
checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd83fc7e66c5df56d1de2cf94904a61d23ed07d056f5f3fb227cdd17f187772
3
+ size 11422536
checkpoints/Qwen2.5-3B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d99e1ddbc8d491c289fadfb3f0b0612dda794e46529cda5059e763aa70f2528
3
+ size 6520
checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4586e2577df5c7df99f7f22a9eb9c344aa93bfea80555b0225f947467a9d86
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1624ef9770b8f455f1fa79fd5fa6ffca4c49ba7f89fc032dc21b0a014579023b
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5c41836229bdff3422379c674677c70e8d3240661acf74476cc91e31f193211
3
+ size 1064
checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd83fc7e66c5df56d1de2cf94904a61d23ed07d056f5f3fb227cdd17f187772
3
+ size 11422536
checkpoints/Qwen2.5-3B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e169f098a68b4661c2a2521e7db484dd445c1f0ca62b3572f0fc3889140ef51
3
+ size 6520
checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c42cbccd5d269445f5eb1566f25bcd51983815fb3b57b92b6e3a0ee915110c0
3
+ size 1064
checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-3B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4bb6f95b333552f9f8d35969d13ea720dd42273da395067da9c7fab0ed7593
3
+ size 6520
checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c42cbccd5d269445f5eb1566f25bcd51983815fb3b57b92b6e3a0ee915110c0
3
+ size 1064
checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-3B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e83ebcf42b6d00694aa9b2b3196da0e762ba65ced6098601c2e46e2c2d468205
3
+ size 6520
checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
3
+ size 14448
checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5ece3009f0dd4cdbfe8f9959c676941ec9c491dac2e1c44921e072bc1c9e639
3
+ size 1064
checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-3B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef5b2882b27e087d809932593d35f690889d7b3dd76a780aa657bed8e159d99
3
+ size 6520
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f40633f004176b2109772dc07f160e3d81ce616f4dae21ddcbe489499e86e48a
3
+ size 4932750888
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76d90df5c851682a030dc7f7afd4d57839eadfc6208a99002053be32783cafe7
3
+ size 4877660672
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea82ca4707d8122663a228e45f83d991c9faa58c0eec8a4d959687d416f9b5a
3
+ size 4932750888
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82fb9739cd7e7157d812431a475c27478cb6d784ce0b0c53caab8bbfae000c32
3
+ size 4877660672
checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d86c7f3ed731cf3ed7f34910b6c30c778c992882e3eae3ab740d3c16e4fe634
3
+ size 4877660672
checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d48a82f7a99cb23f8609b967c272e022c0b6e3cff03240069e6bed81d0ea6ea
3
+ size 4932750888
checkpoints/Qwen2.5-7B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:698bccf4cccc74a7705b457cff6fbeb2e1e40d2cbaf5a59479a70a6e7349298a
3
+ size 4877660672