Yaning1001 commited on
Commit
4f97cff
·
verified ·
1 Parent(s): edf49d1

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +10 -0
  2. checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
  3. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth +3 -0
  4. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth +3 -0
  5. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt +3 -0
  6. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json +3 -0
  7. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin +3 -0
  8. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
  9. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
  10. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
  11. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
  12. checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
  13. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
  14. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
  15. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
  16. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
  17. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
  18. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
  19. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
  20. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
  21. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
  22. checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
  23. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
  24. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
  25. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
  26. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
  27. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
  28. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
  29. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
  30. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
  31. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
  32. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
  33. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
  34. checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
  35. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +3 -0
  36. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors +3 -0
  37. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth +3 -0
  38. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth +3 -0
  39. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt +3 -0
  40. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json +3 -0
  41. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin +3 -0
  42. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth +3 -0
  43. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth +3 -0
  44. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt +3 -0
  45. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json +3 -0
  46. checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin +3 -0
  47. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors +3 -0
  48. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors +3 -0
  49. checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors +3 -0
  50. checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors +3 -0
.gitattributes CHANGED
@@ -139,3 +139,13 @@ checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/token
139
  checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
140
  checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
141
  checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
139
  checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
140
  checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
141
  checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
142
+ checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text
143
+ checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
144
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
145
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
146
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
147
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
148
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
149
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text
150
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text
151
+ checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dea894031550f052a88a6f7448c02831ed9cf20b1e417176d4208573554c6e73
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80b76454021945f9531fb2ccbe7a32b66dd1f31ed30f310ad78bded418cb71d2
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
3
+ size 11422356
checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796
3
+ size 3087467144
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7
3
+ size 6520
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5
3
+ size 14448
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d
3
+ size 1064
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
3
+ size 11422176
checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7
3
+ size 6520
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b757d9e994524104820728f1347cc4a41247be150dc32b73b9b3f45deebe352f
3
+ size 4986211200
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75e0cfc2c662c54bf5e4a4c7e6037540386087c0cdf8e87feadab6b70b77539d
3
+ size 4954847240
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f651272df1b4a6e53555f54a447c664890d5ea60662fe11e3800bb117b15b595
3
+ size 4954847280
checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:774afbf6338e2bf1ea5bd1b4d1bfff1384168de879aa4ac66a01b70ad7ff94a7
3
+ size 4877660672