Add files using upload-large-folder tool
Browse files- .gitattributes +17 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1934/model-00006-of-00006.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_2.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_3.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/scheduler.pt +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors +3 -0
.gitattributes
CHANGED
@@ -91,3 +91,20 @@ checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwe
|
|
91 |
checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
92 |
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
93 |
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
91 |
checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
92 |
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
93 |
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
94 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
|
95 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
|
96 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text
|
97 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
|
98 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
|
99 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
100 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
101 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
|
102 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
|
103 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
|
104 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text
|
105 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
|
106 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
|
107 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
108 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
109 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
|
110 |
+
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:037a6104e8d346446495b5eac65e6f95f767784bb86976a522ba1d8d2ebccf38
|
3 |
+
size 4986211200
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16ec32d87e8ce5e68825f56556a248a320087a2dec560d944de46d7743126f9d
|
3 |
+
size 4954847240
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:148a793687797aba9facb0b118201df3db239818567d2276b22a1dd1b9a6cfaa
|
3 |
+
size 4954847280
|
checkpoints/Qwen2.5-14B/babylm_shuffle_control_10M_seed0/runs/checkpoint-1934/model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fa9f0f8b233569b82cd667e8c5ca8dc427eec8eca49dd45aa0a3438a645cf52
|
3 |
+
size 4734533096
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15cf6eeb694c805493de414d07ff667947929feec9e4f0fcf42ce5cf0a018ddb
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdeb95f762226d00df8620ef583da32215d9a73bfb95bb43993ef6983a7ee1b9
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70e891007ffa086a3d99eebe131f1ed9435b0a35734c7e565ed116cb48c8c3f4
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d912986edede51d039c7a1938014cdbf5c5652c76b4bc1e02a0281b27110931
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e667a7d18d94098aefa2473386a7a3e456dff729cdf04a1f060f32b0d8b8fe7
|
3 |
+
size 11422176
|
checkpoints/Qwen2.5-14B/babylm_shuffle_deterministic84_10M_seed0/runs/checkpoint-1934/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f191cf2b92afb8bbc237c787c0a30b450f779f0671380457f9f73b0ca14995b0
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_shuffle_even_odd_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|