diff --git a/.gitattributes b/.gitattributes index b759f54c5a1505fd41a10319875a6953c787bcc2..7a560dd80e4c41ccf883ac39f7c4bb12dd67dca9 100644 --- a/.gitattributes +++ b/.gitattributes @@ -59,3 +59,20 @@ checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/artifacts/models--Qwen- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/tokenizer.json filter=lfs diff=lfs merge=lfs -text checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e new file mode 100644 index 0000000000000000000000000000000000000000..885c5514c7a9ebb84bfecbccb6f7281ef4592b6d --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +size 3979614448 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..383698ee64c0b8e0ec66f9ffc0f75af212855bee --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03bbc4b3b2b35894d533efe6514b73480926ea27 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e238a7a4dec4d38d336806d198ab64df5b042d76 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba new file mode 100644 index 0000000000000000000000000000000000000000..e238a7a4dec4d38d336806d198ab64df5b042d76 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb new file mode 100644 index 0000000000000000000000000000000000000000..383698ee64c0b8e0ec66f9ffc0f75af212855bee --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 new file mode 100644 index 0000000000000000000000000000000000000000..c9a026a826f7bcb4b1206bf4953c9690e20c2875 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +size 3995327992 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9a026a826f7bcb4b1206bf4953c9690e20c2875 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +size 3995327992 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03bbc4b3b2b35894d533efe6514b73480926ea27 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e238a7a4dec4d38d336806d198ab64df5b042d76 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba new file mode 100644 index 0000000000000000000000000000000000000000..e238a7a4dec4d38d336806d198ab64df5b042d76 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb new file mode 100644 index 0000000000000000000000000000000000000000..383698ee64c0b8e0ec66f9ffc0f75af212855bee --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 new file mode 100644 index 0000000000000000000000000000000000000000..03bbc4b3b2b35894d533efe6514b73480926ea27 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f new file mode 100644 index 0000000000000000000000000000000000000000..dd1309620ebee47f63ac40b9b235b7ae5f9711e6 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +size 1698724408 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e new file mode 100644 index 0000000000000000000000000000000000000000..885c5514c7a9ebb84bfecbccb6f7281ef4592b6d --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +size 3979614448 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa new file mode 100644 index 0000000000000000000000000000000000000000..0504bafae1ddcbc85d48285c87c8321cbaff57fc --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +size 3885134104 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 new file mode 100644 index 0000000000000000000000000000000000000000..c9a026a826f7bcb4b1206bf4953c9690e20c2875 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +size 3995327992 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0504bafae1ddcbc85d48285c87c8321cbaff57fc --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +size 3885134104 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9a026a826f7bcb4b1206bf4953c9690e20c2875 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +size 3995327992 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..383698ee64c0b8e0ec66f9ffc0f75af212855bee --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f52854c5a074379894d35c1a1ba7fc3c95b852e4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +size 3995348776 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..885c5514c7a9ebb84bfecbccb6f7281ef4592b6d --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +size 3979614448 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03bbc4b3b2b35894d533efe6514b73480926ea27 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e238a7a4dec4d38d336806d198ab64df5b042d76 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +size 3995328064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd1309620ebee47f63ac40b9b235b7ae5f9711e6 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +size 1698724408 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_0.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef6e67676ca0c8b9758d9494bfd095bd55feda7a --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ae0f8c0973bd8f49e7d475791e1334e0204d90696971f9983ce5cb629db508 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_1.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..66abb3609cddbe9625581ad142516353a486a510 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582deaed4156b10690b3823f0fabd8dc67208eff035e24ae52cd85b9d874bb8a +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_2.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..635ffa617d1c8b1d59a090f5f803c76bae03ee82 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c0d37a6d8b99cbd89650c46b5f2f132c4da338c68ff6d192f08a6bcefbbceb5 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_3.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f14ac5d45b1965e0d81a159cedafcad304f854d --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbdf9f0e9aac95e08af74c5bf009639eb93bbb564c71abd5e3aa81adf1c3991b +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/scheduler.pt b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4398f46c86eb8e25a5e9ac3b07fe5c7ac56953d4 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b1826aaba117362f4adfc02c2de0205a70775a4b414256a9c9ffbc64365305 +size 1064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3b14f8affb24073c5b5274674f70277c042593dc --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516 +size 11422356 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/training_args.bin b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..21f3bde4181aa964096261b96113a6dfa4061736 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d6815084f9707f1d8d990ce7c2269742cc992d1a36e2e1dceb5b67e6def274 +size 6520 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_0.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3dccc4cb6b04d481f1f29e054a722eefdff1fbf2 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31effcc966f4272bd7330ebcde7da65f7dbd70afe27a289d2a31856fbc63f379 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_1.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..98cfa5867d6ec56d2eee7c67b44f5fd61d4e09ab --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99672ac4c61aff9b2bca8a9e80f74417b8b0767809c3454f66042d5f904ced7a +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_2.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..347d2b1332054c3a9112df0605ef33aba35b9aa3 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0365624c9f07469b8549f58376cdc199fd538b48405ad51abe3c46cc06f193ea +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_3.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..183a0ffdbeff05cf1c18d2bce5fa85734404b759 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0db9bdc225f9583b93b0affe946bd62f8983aae91455323924cab39bef020b1 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/scheduler.pt b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c15d26840978659f2b42d9cf3e3683f959c24fd --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add49698959c0d68285301bf9cf3bc2d662d3dfb40309603eebc0e6a0d5f7268 +size 1064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3b14f8affb24073c5b5274674f70277c042593dc --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516 +size 11422356 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/training_args.bin b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..21f3bde4181aa964096261b96113a6dfa4061736 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d6815084f9707f1d8d990ce7c2269742cc992d1a36e2e1dceb5b67e6def274 +size 6520 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_0.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3dccc4cb6b04d481f1f29e054a722eefdff1fbf2 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31effcc966f4272bd7330ebcde7da65f7dbd70afe27a289d2a31856fbc63f379 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_1.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..98cfa5867d6ec56d2eee7c67b44f5fd61d4e09ab --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99672ac4c61aff9b2bca8a9e80f74417b8b0767809c3454f66042d5f904ced7a +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_2.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..347d2b1332054c3a9112df0605ef33aba35b9aa3 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0365624c9f07469b8549f58376cdc199fd538b48405ad51abe3c46cc06f193ea +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_3.pth b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..183a0ffdbeff05cf1c18d2bce5fa85734404b759 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0db9bdc225f9583b93b0affe946bd62f8983aae91455323924cab39bef020b1 +size 14960 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/scheduler.pt b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c15d26840978659f2b42d9cf3e3683f959c24fd --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add49698959c0d68285301bf9cf3bc2d662d3dfb40309603eebc0e6a0d5f7268 +size 1064 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/tokenizer.json b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3b14f8affb24073c5b5274674f70277c042593dc --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516 +size 11422356 diff --git a/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/training_args.bin b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..7828183e387a5de0b73ec7526646244636841d52 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99b3b7e5e47bfbb2fda40cbb4280960d21c1009717e90fc0b42eecd86d39bff +size 6520 diff --git a/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1934/model-00005-of-00006.safetensors b/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1934/model-00005-of-00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..90bb1e5f52f32de87166fb68513cecfeb69d9687 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-1934/model-00005-of-00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0958bd57a396d1812c21ce2569ea48a9d04bc4f94ffc7422c2fd9edc743ceb00 +size 4954847280 diff --git a/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-500/model-00006-of-00006.safetensors b/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-500/model-00006-of-00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8d4e435746cc556a532535ee30f9db39671f584 --- /dev/null +++ b/checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/runs/checkpoint-500/model-00006-of-00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e410ee04332cd44975c07dc74799e2b4ede8bbbb7d02938fe38f81bc15cb343 +size 4734533096