Yaning1001 commited on
Commit
08508e4
·
verified ·
1 Parent(s): 45f49cb

Add files using upload-large-folder tool

Browse files
Files changed (35) hide show
  1. .gitattributes +4 -0
  2. checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00001-of-00006.safetensors +3 -0
  3. checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00003-of-00006.safetensors +3 -0
  4. checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00005-of-00006.safetensors +3 -0
  5. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00001-of-00006.safetensors +3 -0
  6. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00004-of-00006.safetensors +3 -0
  7. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00005-of-00006.safetensors +3 -0
  8. checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors +3 -0
  9. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00001-of-00006.safetensors +3 -0
  10. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00003-of-00006.safetensors +3 -0
  11. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00005-of-00006.safetensors +3 -0
  12. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors +3 -0
  13. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors +3 -0
  14. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00003-of-00006.safetensors +3 -0
  15. checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors +3 -0
  16. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth +3 -0
  17. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth +3 -0
  18. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt +3 -0
  19. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json +3 -0
  20. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin +3 -0
  21. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
  22. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
  23. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
  24. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
  25. checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
  26. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
  27. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
  28. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
  29. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
  30. checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
  31. checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
  32. checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
  33. checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
  34. checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
  35. checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
.gitattributes CHANGED
@@ -110,3 +110,7 @@ checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/model
110
  checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json filter=lfs diff=lfs merge=lfs -text
111
  checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
112
  checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
110
  checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json filter=lfs diff=lfs merge=lfs -text
111
  checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
112
  checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
113
+ checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
114
+ checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json filter=lfs diff=lfs merge=lfs -text
115
+ checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
116
+ checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81e4128a2d7503b09c0170e027200e2230103a7c004093060da4576aa276bb66
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00003-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c7b1f45b578a265bff5a04acb0ea9b1d8f98a9ffd11f4bbda7d7ec70d9f3a50
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/runs/checkpoint-1682/model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e153fcbd013c64f4191f09f51f0192fefbd037b3946e9a42559412e9ff1460b2
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2526ed6f72e2cb3b7f83e17bd33e188561ee7b9cdfd5027a3bab3465e0563ca6
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00004-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:708cfadd3b5e4466f4167405cf3f257ca83f8f8972296c13430a9a67b132b87d
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624ae1b0799b6c2dbf8852a2da1fb0746c007fba414d5cc0a3b0c6a8a3a16af3
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bceefb0df0d91d98b27fcfa7b6caf96e76f7aabb955e8caced63462d2a7181c7
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:368f4d27fa095163571428806b53892643e960f6cd3776d3152e5c947b881ca3
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00003-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9c514cb71d66e45b96d23c2b3c70713a13a9bb152ae1c06076ebdb2fd7156b9
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f70d9f7d5d854eca211da576b58b221a799c16c63c4c1abe03a53585806e31c
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:783c20cabe7cff788f2f377ba1e30041c39f4564c8a1fac06f8c8409659a05e5
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b083a43624470747040b126919a11c288fe10a0291f76eb14c936df3f88d0be4
3
+ size 4954847240
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00003-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b96a0ac369f6bfb21f50778f2f36aeecc61cef4288f66b6ac8ebc5f2dcfe48fe
3
+ size 4954847280
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/model-00004-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7819823617ed8fce1a4f57a21696d329f1d83a0c6c95d0d4769e1e9c12534209
3
+ size 4954847280
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4586e2577df5c7df99f7f22a9eb9c344aa93bfea80555b0225f947467a9d86
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1624ef9770b8f455f1fa79fd5fa6ffca4c49ba7f89fc032dc21b0a014579023b
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54c54f6c898e2c4d700d91a0e23780ae401fe3d06588f050613f7dbc01771d8c
3
+ size 1064
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd83fc7e66c5df56d1de2cf94904a61d23ed07d056f5f3fb227cdd17f187772
3
+ size 11422536
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e433799628a7912ba5bba3114e75acf7d050267bfd6bf913c3a45f95bd7b9633
3
+ size 6520
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5fc6a13124c3b11ca061128177b35eda88f08b4546c4c3ba7fa375ded403ba5
3
+ size 1064
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2775aaa04243687a971b4fdea9993049392aa966f47084cd09878e65628bdd91
3
+ size 6520
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14be263ddae55a4d0ba547f494116d339b4c91e7ef69d00cb6af3bfeb3778c2
3
+ size 1064
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed6206c7c99f9bc3e1e0577e9acfec7afcca6d0b0e2a5f102e4ff2aa99e0c3b1
3
+ size 6520
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
3
+ size 14448
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:085de42942f9961f0bf09616d2cf0a824f124117f147dc3f2eaa5006e1bd8a8b
3
+ size 1064
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b2d3d5265579ff0a8b6e1301a14236bbd2f0ac977e2d12bc787dfe665a81a5
3
+ size 6520