diff --git a/.gitattributes b/.gitattributes index 42d2d9eb23531f1dbb10be95650412d08fb0de02..bd98b16fafcb4d307de32ef22dd4f73f8ca39ec0 100644 --- a/.gitattributes +++ b/.gitattributes @@ -139,3 +139,13 @@ checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/token checkpoints/Qwen2.5-1.5B/babylm_hop_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text checkpoints/Qwen2.5-1.5B/babylm_reverse_partial_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors b/checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de4b04359b427ed291b005f62b749531d45e3e5f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +size 3087467144 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd306cfe5bafca140505e8387970e7a987c09639 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5fa2e530092241493c32f0c0f39e627199122c47bb6f211aee29c5c16a79585 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2620dd8f51435befa9abf525bc4e5a65e8d556cc --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2461f099107bb643a77373b905b4b77530e8cc1b6a3a0574158caccf87f309a7 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc02aa509ca2a356e0255043f91cc7f224dde196 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea894031550f052a88a6f7448c02831ed9cf20b1e417176d4208573554c6e73 +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3b14f8affb24073c5b5274674f70277c042593dc --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516 +size 11422356 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a08a57c15a7cebf2796d6af2af9bdf297f5a673 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727 +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e91217c4ae9a57c7b3559730943e3ac86ac4993a --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5bb9d78abec4745ad306478fdca43f2c10cf7fed --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd53dc32b8f53673f5171a5201861a087708092 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b76454021945f9531fb2ccbe7a32b66dd1f31ed30f310ad78bded418cb71d2 +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3b14f8affb24073c5b5274674f70277c042593dc --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516 +size 11422356 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a08a57c15a7cebf2796d6af2af9bdf297f5a673 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_reverse_control_10M_seed0/runs/checkpoint-50/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505ce7403e185848d1da9ccc9de376fb2d5dad305d99b1e6e7cc973e5e6c6727 +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..22feddd863845a5d52ff9a64606bab649023fec3 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff541480f6d1472ca5e12b978d7f63e314d5839c --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10f198ee3ebfcb2d59eeae92feb96e34984a9af --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..d571e17ca2cfcbd9aaeb7faa2fc39fc12683a23f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088 +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e91217c4ae9a57c7b3559730943e3ac86ac4993a --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5bb9d78abec4745ad306478fdca43f2c10cf7fed --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..69aebbf5736830c6237c5716372d60b7bbbe01ee --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..d571e17ca2cfcbd9aaeb7faa2fc39fc12683a23f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_control_10M_seed0/runs/checkpoint-50/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f502ba9bc0dd572671c7986a9b5e17d174c072833cfbed027c27ca8b02d9088 +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 new file mode 100644 index 0000000000000000000000000000000000000000..de4b04359b427ed291b005f62b749531d45e3e5f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +size 3087467144 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de4b04359b427ed291b005f62b749531d45e3e5f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +size 3087467144 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..22feddd863845a5d52ff9a64606bab649023fec3 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff541480f6d1472ca5e12b978d7f63e314d5839c --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10f198ee3ebfcb2d59eeae92feb96e34984a9af --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..b51fd7d2118e8560395c8f1296a30f9d53447380 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7 +size 11422176 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd939d530ad8b49e95a5839f9acc090d78a816e3 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1290/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e91217c4ae9a57c7b3559730943e3ac86ac4993a --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5bb9d78abec4745ad306478fdca43f2c10cf7fed --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..69aebbf5736830c6237c5716372d60b7bbbe01ee --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..b51fd7d2118e8560395c8f1296a30f9d53447380 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7 +size 11422176 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd939d530ad8b49e95a5839f9acc090d78a816e3 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-50/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470e749c71d574f5d9ce69b2cd687489c87db3f2d9e418dd9b9ea4f629c38a2b +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 new file mode 100644 index 0000000000000000000000000000000000000000..de4b04359b427ed291b005f62b749531d45e3e5f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/blobs/a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +size 3087467144 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de4b04359b427ed291b005f62b749531d45e3e5f --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-1.5B/snapshots/8faed761d45a263340a0528343f099c05c9a4323/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a961db72e75d52b18e6b0c9d379e51a26973b233385e0e127fdda7d648aec796 +size 3087467144 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..22feddd863845a5d52ff9a64606bab649023fec3 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed2d17aef80308e7357fddddd9df5a92cbad7acc2e75e5ced938c7fd5c705de +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff541480f6d1472ca5e12b978d7f63e314d5839c --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e54406be159a669d37c2a8d1da2335a08a4290b5619b11dece5135899339ca4 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10f198ee3ebfcb2d59eeae92feb96e34984a9af --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db97a1417e300ff6b1875ef25b4d3b44d4916d206b40def602060e42239a70a +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..b51fd7d2118e8560395c8f1296a30f9d53447380 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7 +size 11422176 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2d55e237292c9f3b0017f3e615f063a0298a6ef --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-1290/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7 +size 6520 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e91217c4ae9a57c7b3559730943e3ac86ac4993a --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d60f0a8e64b11aa424754a846eeebee548dbc50a9d1a6a7c113160af51004f +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5bb9d78abec4745ad306478fdca43f2c10cf7fed --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f2a34760ec9ab498537a3bf9bcd8b3bba0757435d287a57b2ee1a30faa74d5 +size 14448 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..69aebbf5736830c6237c5716372d60b7bbbe01ee --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276598cead26a6101a885194fd8e9857656d4719c7ddc5c5c9c023fca95c664d +size 1064 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..b51fd7d2118e8560395c8f1296a30f9d53447380 --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7 +size 11422176 diff --git a/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2d55e237292c9f3b0017f3e615f063a0298a6ef --- /dev/null +++ b/checkpoints/Qwen2.5-1.5B/babylm_shuffle_even_odd_10M_seed0/runs/checkpoint-50/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6848746231ae1afdb3e39700a0da609f6d8e56b041274b9169e829a62f96abc7 +size 6520 diff --git a/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e88392ebe357fee4062469b444f971d3fe2a80dd --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b757d9e994524104820728f1347cc4a41247be150dc32b73b9b3f45deebe352f +size 4986211200 diff --git a/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c880dd4b2f605c0f7cf2452f6e4396c58d43926e --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e0cfc2c662c54bf5e4a4c7e6037540386087c0cdf8e87feadab6b70b77539d +size 4954847240 diff --git a/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5652c8799e4042bba0d942bf9416f3cb29aee71b --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f651272df1b4a6e53555f54a447c664890d5ea60662fe11e3800bb117b15b595 +size 4954847280 diff --git a/checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b853c281a0e094cd252a2ddc2eefca981ee8f17f --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_hop_control_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774afbf6338e2bf1ea5bd1b4d1bfff1384168de879aa4ac66a01b70ad7ff94a7 +size 4877660672 diff --git a/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58ae58e11863d9d0f60d38541e08794c49b17953 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b6838cfbf023009f4ff1e9af6212ae46d8ac87e1f7fcf5b06c0337530a3e8b +size 4877660672 diff --git a/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00002-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8be334e218fca3af94e3bbac78a75cc760ad87f --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_hop_words4_10M_seed0/runs/checkpoint-1122/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409b7b45349449b99abc7f04469ab24803cf7aeafa861e90b870d94fb4d05c7a +size 4932750888 diff --git a/checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..180306d82fac3ee967e1a7016c32e0c8070d4afc --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_reverse_control_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62cf4226687aefd27ec98a1af0a73099c6cec54222cbda52fd309e670cdd6c9b +size 4330865088 diff --git a/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00002-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05119bf86f755d13c911c5626b6cb21cecdd4f31 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa43e4e78d2d296f7961e6dde446bbbd13eaec503b35fbcad9619ec9cf33084e +size 4932750888 diff --git a/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a45e9c636082af452d091e75aec0d77939e8990 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_reverse_partial_10M_seed0/runs/checkpoint-1382/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600f907b3da6d1534077a617135ecb247b1bc3c1bbe5c4ef4ae095f8f2472337 +size 4330865088 diff --git a/checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e093e55681f35ae0380a10dceee9dca734aa6215 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1290/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18be20272f18aa67dc10170d64b418b32bf94774dd011f7bdefe490ca64e3df0 +size 4330865088 diff --git a/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53029bc7bbb21426266aa424f28d53bd653ce6e4 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9e1a82b770e3e609b2851ff2edfe43783558fefc0f83735535e8c25a0b92f58 +size 4877660672 diff --git a/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors b/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a12ab8a102c7a46847469edf425a66cce93d101 --- /dev/null +++ b/checkpoints/Qwen2.5-7B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1290/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d841a7370dff21650a05c3a695b7fbf9a03b6ee12adaedd738bb035ea7d558f +size 4932750888