diff --git a/.gitattributes b/.gitattributes index ce8edd1fa2dd26255bbafc1a98c3d4c667f1e4eb..6ed548b18d9a761c324777671f6b0c1fe6c7fbee 100644 --- a/.gitattributes +++ b/.gitattributes @@ -124,3 +124,11 @@ babylm_reverse_partial_10M_seed0/runs/checkpoint-100/tokenizer.json filter=lfs d babylm_reverse_partial_10M_seed0/runs/checkpoint-1000/tokenizer.json filter=lfs diff=lfs merge=lfs -text babylm_reverse_partial_10M_seed0/runs/checkpoint-2919/tokenizer.json filter=lfs diff=lfs merge=lfs -text babylm_reverse_partial_10M_seed0/runs/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb filter=lfs diff=lfs merge=lfs -text +babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 filter=lfs diff=lfs merge=lfs -text +babylm_reverse_control_10M_seed0/runs/checkpoint-1800/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_control_10M_seed0/runs/checkpoint-2700/tokenizer.json filter=lfs diff=lfs merge=lfs -text +babylm_reverse_control_10M_seed0/runs/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-1400/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-1400/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e723fb64ae1ee1bcbf858504d62a1529e08c3c0 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-1400/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbaff5b23cea7af9e77119d9303f8375f352da565821ad54f89d7a5c99891bec +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-1700/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-1700/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d196aa15c55d61d5e8a9c35ab847cc2754d93988 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-1700/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ba721e0cb6002fec40acf7b03f31a6122ef2a9168d82ecc4f2f60a8db40aee +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-2200/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-2200/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f86b34bc143cc5c1223cc7cd6683ff5a099b7ff3 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-2200/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de41c97f1b85191e92c9748ae33c27b2d434c86fe7e93eff7b504a9f4adc65c1 +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-2300/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-2300/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2121ad99f07a1f10987a2379e1e626e31e622d12 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-2300/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf9a4443150167813cb08d2019804bff1012d4de0b26e029d3d9ecaa172c144 +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-300/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-300/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16bd4ad9c557d5640d3ec133c6f3aab1dbca14a9 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-300/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b81f88af8ba9cea3f25cf3f9064180deb9040e3e1315e753d27980a52301fe +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-400/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-400/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa6cd19d2dccd5b0bdd5258f13e68522f0ffe3f8 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-400/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8059b0ab50260d73edb8e1bd28032119d3a4d4d8299988335931d9e215cd3c +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-700/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-700/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f39c4647d9c17760ae6591a94b8ebca5c87e62c --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-700/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0685c0493fb2fea5eed2a5f74ce427e29aeab8b71cb6db7b1bb42c7c34c67e +size 4965798912 diff --git a/babylm_hop_control_10M_seed0/runs/checkpoint-800/model-00001-of-00002.safetensors b/babylm_hop_control_10M_seed0/runs/checkpoint-800/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d54dcd15592a2adc53a3974e7d629f56020dce2 --- /dev/null +++ b/babylm_hop_control_10M_seed0/runs/checkpoint-800/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e2d812cfda48f4493dd70ac6b8aa9cbd2b4384242b58df2f7bf693f504c0e9 +size 4965798912 diff --git a/babylm_hop_tokens4_10M_seed0/runs/checkpoint-300/global_step300/zero_pp_rank_1_mp_rank_00_optim_states.pt b/babylm_hop_tokens4_10M_seed0/runs/checkpoint-300/global_step300/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de22495e93620cbc1c712691c2b3344850cbcc28 --- /dev/null +++ b/babylm_hop_tokens4_10M_seed0/runs/checkpoint-300/global_step300/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5aef1ba91d0911887f2e0e14fa6cb6b3ffa2dba6602ec9bf349fcc5ce5f7245 +size 12851010643 diff --git a/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb new file mode 100644 index 0000000000000000000000000000000000000000..82a877359be75c9c7ad1226b362efeeabf2edef4 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb +size 1459729952 diff --git a/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 new file mode 100644 index 0000000000000000000000000000000000000000..e362b81bf93cef8c6d96b08171bab63416808c70 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/blobs/584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 +size 4965799096 diff --git a/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00001-of-00002.safetensors b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e362b81bf93cef8c6d96b08171bab63416808c70 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584d8d3e3f82f7964955174dfe5e3b1cf117a9d859f022cfdf7fcb884856e002 +size 4965799096 diff --git a/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00002-of-00002.safetensors b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82a877359be75c9c7ad1226b362efeeabf2edef4 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/artifacts/models--meta-llama--Llama-3.2-3B/snapshots/13afe5124825b4f3751f836b40dafda64c1ed062/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4719a04514ec2f060240711b7c33ab21187cac730ecaba3040b7a0fd95a9cefb +size 1459729952 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_0.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e6f6c0d5fa3f1dc9dc7d8a6efc5eb202f3bc72bc --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597a8ecb0ce0f65c4e7449874d02a6403185578c168ac3acc602a62fc7292436 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_1.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c11b36f7fac309c0b376385d3500b7d79389f75d --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a486bd24422fab4e1b364f49b85424fa3c6f3473311e58e9ed868d1b2de3fda0 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_2.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..35ea8bb156e3d14aa6596bac40f7dbbe872bcc28 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4f2cf28f7ae5e3c3cab1c627b13348703f61bdd28206c064ffa51599199c18 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/scheduler.pt b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd2b918d8745abbf069d63eb10b5e470cf41131 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e8d7589fd595ca926efd5a06b03cac6aa101022f6c4d8ba499fff770a4c8c8 +size 627 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/tokenizer.json b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..c76f0701115b50c463b66cc3645d7a3654ab5205 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda2ecf7b5daf3cb77324ea6c5b9cb8bf47119249a6d756ef2dd4d62540ac6f +size 17210554 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/training_args.bin b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..35c83e0aeb67b51f9041a0775518d818bd4514c1 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-1800/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892167fd00638a9a336920c633c1535594e6726eea0c8de0982206892bd302fd +size 6011 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_0.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e39746492b970dcc6a87f52bb29c56fc5ba161fc --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce9e99fc568ea7d69c95f8da5622cf2e24538055df1accfbeaccff9c07072311 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_1.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..abccc0fe9164aa3960835284734191dc786ae981 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf507f5973fce5bbcb6429ce7c7164e2e033221c79824bee0dcc77248e530ab9 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_2.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6fc0da9c514e1a86118ed6e753db92d26ba258c9 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd2607e58c5b6d795789aee02c9a0a2d71e807483894bf38b21ea6bacd6acfa +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/scheduler.pt b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..802bfd1ebc11e7c0419f3d56c8e73bca6baa30b5 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0412d9421ae5a006db5668e62644e7e5fad7dadb27e37d6cca0640e73c49f4 +size 627 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/tokenizer.json b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..c76f0701115b50c463b66cc3645d7a3654ab5205 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda2ecf7b5daf3cb77324ea6c5b9cb8bf47119249a6d756ef2dd4d62540ac6f +size 17210554 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-200/training_args.bin b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..35c83e0aeb67b51f9041a0775518d818bd4514c1 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-200/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892167fd00638a9a336920c633c1535594e6726eea0c8de0982206892bd302fd +size 6011 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_0.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..12d8f134d0ace768aa9a4fc9a1c7787b2ce68b40 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd745605ae8f150c3645104631b2d3c3b452eecda3ab1f66d0a3f474af022ff +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_1.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7255d4b96382a76a01d62b0f3fb8ed7ba214a8cf --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab5d049f3d3fc102f2df0c1651bc9d13107a3c0c772fd671f399b9d7d1de545 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_2.pth b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf2513c6be393ffd7f18b9966efe1ea94961ce76 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e03f5804d1958af28b457d1c95eadeccb6d55a564daf236124a0bd65854c268 +size 16567 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/scheduler.pt b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2636b79ff2eb973cb99847a892eaf582e7ca55fe --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f075f7d0170ab60037de0c2b26d268f08d97a6f30854894cee8dba12ae0ba147 +size 627 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/tokenizer.json b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..c76f0701115b50c463b66cc3645d7a3654ab5205 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda2ecf7b5daf3cb77324ea6c5b9cb8bf47119249a6d756ef2dd4d62540ac6f +size 17210554 diff --git a/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/training_args.bin b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..35c83e0aeb67b51f9041a0775518d818bd4514c1 --- /dev/null +++ b/babylm_reverse_control_10M_seed0/runs/checkpoint-2700/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892167fd00638a9a336920c633c1535594e6726eea0c8de0982206892bd302fd +size 6011 diff --git a/babylm_reverse_full_10M_seed0/runs/checkpoint-1000/model-00001-of-00002.safetensors b/babylm_reverse_full_10M_seed0/runs/checkpoint-1000/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2afeb1dc855f7e2105e8ea9a196fdd906ed6857 --- /dev/null +++ b/babylm_reverse_full_10M_seed0/runs/checkpoint-1000/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54705381e2048ef8cc8064b0971611223149714b5fac2a8c7bf5b554ed3dee1 +size 4965798912 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1200/model-00002-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1200/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edfa2d722dbdb6cd464c435d498b9c3d8af39c31 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1200/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d389e3f55ac39d5a71950704f8e6ce2e7f39386d2ec4b22a7fbf3ad0793d95 +size 2247734920 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_0.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5509f0e1ece25901639e38b63337f0f28e33b98d --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0123f1b841cbb90ad2cc1a10c38027bc63872dc02a831b18d254a6186f0ffff0 +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_1.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdaddc4981c690246dfa665b10da40b38a679bc3 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e82dbca3ee98b4aff4d87464271202c99a718b90530a7719851b8b6a191547 +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_2.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd1ca9202bb0004e7be63108d043e05db918daf3 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc0a29e8caac820aa227d61191352d70074e7bc59c8656d34721d88d568ccb2 +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/scheduler.pt b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec5f7bd05f13db1133b65abf3adad94122fb1c8c --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:535e85e29b289ae27e42bbc01d5f9f60bb0732f7e838f447fec6e6bcbb245d0f +size 627 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/tokenizer.json b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..d0af2aebd22a29e048ac5f32c95a99f6ee0f465b --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fba7b84ac8c089d417b794dfc0527040604b90e2cdfe6e9df5b55afe9eab61a +size 17210282 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/training_args.bin b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..cfafb617743c42a0be1f4d87e5cb3b3292f2ced8 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1600/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cfed0422f99f2449cf26f92edc99e3943bd57b7b5a4d7721a570513f8f8678 +size 6011 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1700/model-00002-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1700/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2865e2181fe49945b7a477c30cafd9a322b10832 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1700/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45370e503bd2a6efe4a0f09381b06ee179fe76e5eccb149af5863852ef40f6c +size 2247734920 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-1900/model-00002-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1900/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0cf560d1bffed435679418ce9c5479f3708e450d --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-1900/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b0e840c77e2430f511f02fca93ffb3c4b0f76d1fdafb68a4ec3ec34c4b590b +size 2247734920 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_0.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9829253a45a30486360d23ef44a31e49a0fbb37c --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1200c6256bb3c5211e1fa1cfcea6721e1b8871fd3c8953a59bf49a59f67404c +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_1.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed05b8eb12ac744b29eb407adca7ab9af789a745 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b59dfa224b09069bb1265a6a5cb86c22c34f53669b17ebd9335621f959bf7a4 +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_2.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a26252516294710c0550a7751d8c4bc072b73762 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316a81119e1ab6e1b3e5b9d890ce1d0ca9ea9223094844fdcf8b7d9f0f4bb6c2 +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/scheduler.pt b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e212171e630d6c51c62b8d2b6d958535b421c648 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15eb4a96c60fdafb3fc2f4d6e3b92bcc3a95a78c290add6b6de7f594d5379ad0 +size 627 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/tokenizer.json b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..d0af2aebd22a29e048ac5f32c95a99f6ee0f465b --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fba7b84ac8c089d417b794dfc0527040604b90e2cdfe6e9df5b55afe9eab61a +size 17210282 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/training_args.bin b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..cfafb617743c42a0be1f4d87e5cb3b3292f2ced8 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2100/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cfed0422f99f2449cf26f92edc99e3943bd57b7b5a4d7721a570513f8f8678 +size 6011 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2500/model-00002-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2500/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6283ab01fe8a6fcd4936bd7461e9b45deacf4906 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2500/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b544451972d39053e4e2b44d0796fad7d6554e22133d1906045714cdb13f4066 +size 2247734920 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_0.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..db29a0595c2ddd565d58836a14fe12c1b2df5f08 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c9638a11bb45425f36b41a0b4374e9827e8f164ff57dd09fd085ed322ee34c +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_1.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a981f76500e16ae8aaa8c016eac9d24eb11c25a8 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa48289d1791eec8b3c9bccdb5e89dbe839e263cee93f50324f2c4f1ffe6a9e +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_2.pth b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf02b213af07ae4a6ed4e0fa4c8901e406305380 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c98b3e78f020ee73e4ff068e66643eb1dd3392fbe2e0e05acca1eb4d08f74cc +size 16567 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/scheduler.pt b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7a34964f527da90d8c824d7c916ec1dac402a96 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38171f5daa427b0be124804f5c10af3088c699dc8cff611c060d7ae2975bc3f9 +size 627 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/tokenizer.json b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..d0af2aebd22a29e048ac5f32c95a99f6ee0f465b --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fba7b84ac8c089d417b794dfc0527040604b90e2cdfe6e9df5b55afe9eab61a +size 17210282 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/training_args.bin b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..cfafb617743c42a0be1f4d87e5cb3b3292f2ced8 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-2900/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cfed0422f99f2449cf26f92edc99e3943bd57b7b5a4d7721a570513f8f8678 +size 6011 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-600/model-00002-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-600/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f88826e325475f55c26ada7e4c8a978b8539892 --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-600/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015549dd35763cd99e0293a8b8463e54c9d6fe807ad0c3899366633076854a21 +size 2247734920 diff --git a/babylm_reverse_partial_10M_seed0/runs/checkpoint-900/model-00001-of-00002.safetensors b/babylm_reverse_partial_10M_seed0/runs/checkpoint-900/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3312a1cb3f3ad4495d38a84bb1152ee78b0f37ca --- /dev/null +++ b/babylm_reverse_partial_10M_seed0/runs/checkpoint-900/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d603c0c2e891aa3b2b5d80bb2218b9e1353955c268ea46c2839f622f07377d +size 4965798912