Yaning1001 commited on
Commit
78bdb8e
·
verified ·
1 Parent(s): 58cb75f

Add files using upload-large-folder tool

Browse files
Files changed (43) hide show
  1. .gitattributes +17 -0
  2. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors +3 -0
  3. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors +3 -0
  4. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors +3 -0
  5. checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1934/model-00006-of-00006.safetensors +3 -0
  6. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
  7. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
  8. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +3 -0
  9. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
  10. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +3 -0
  11. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
  12. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +3 -0
  13. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
  14. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors +3 -0
  15. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
  16. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
  17. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
  18. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors +3 -0
  19. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
  20. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
  21. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors +3 -0
  22. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_1.pth +3 -0
  23. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_2.pth +3 -0
  24. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_3.pth +3 -0
  25. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/scheduler.pt +3 -0
  26. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json +3 -0
  27. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/training_args.bin +3 -0
  28. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
  29. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
  30. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +3 -0
  31. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
  32. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +3 -0
  33. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
  34. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +3 -0
  35. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
  36. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors +3 -0
  37. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
  38. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
  39. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
  40. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors +3 -0
  41. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
  42. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
  43. checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors +3 -0
.gitattributes CHANGED
@@ -91,3 +91,20 @@ checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwe
91
  checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
92
  checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
93
  checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
91
  checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
92
  checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
93
  checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
94
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
95
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
96
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text
97
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
98
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
99
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
100
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
101
+ checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
102
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
103
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
104
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text
105
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
106
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
107
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
108
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
109
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
110
+ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:037a6104e8d346446495b5eac65e6f95f767784bb86976a522ba1d8d2ebccf38
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16ec32d87e8ce5e68825f56556a248a320087a2dec560d944de46d7743126f9d
3
+ size 4954847240
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:148a793687797aba9facb0b118201df3db239818567d2276b22a1dd1b9a6cfaa
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1934/model-00006-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa9f0f8b233569b82cd667e8c5ca8dc427eec8eca49dd45aa0a3438a645cf52
3
+ size 4734533096
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
3
+ size 3995348776
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
3
+ size 1698724408
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
3
+ size 3979614448
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
3
+ size 3885134104
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
3
+ size 3995327992
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
3
+ size 3885134104
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
3
+ size 3995327992
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
3
+ size 3995348776
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
3
+ size 3979614448
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
3
+ size 1698724408
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15cf6eeb694c805493de414d07ff667947929feec9e4f0fcf42ce5cf0a018ddb
3
+ size 14960
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdeb95f762226d00df8620ef583da32215d9a73bfb95bb43993ef6983a7ee1b9
3
+ size 14960
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e891007ffa086a3d99eebe131f1ed9435b0a35734c7e565ed116cb48c8c3f4
3
+ size 14960
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d912986edede51d039c7a1938014cdbf5c5652c76b4bc1e02a0281b27110931
3
+ size 1064
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f191cf2b92afb8bbc237c787c0a30b450f779f0671380457f9f73b0ca14995b0
3
+ size 6520
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
3
+ size 3995348776
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
3
+ size 1698724408
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
3
+ size 3979614448
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
3
+ size 3885134104
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
3
+ size 3995327992
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
3
+ size 3885134104
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
3
+ size 3995327992
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
3
+ size 3995348776
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
3
+ size 3979614448
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
3
+ size 3995328064
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
3
+ size 1698724408