Upload folder using huggingface_hub
Browse files- .gitattributes +32 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json +3 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json +35 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json +1 -0
- llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt +3 -0
.gitattributes
CHANGED
@@ -3289,3 +3289,35 @@ llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/
|
|
3289 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3290 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3291 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3289 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3290 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3291 |
llamascope-slimpj-openr1-res-32k/30-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.30.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
3292 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json filter=lfs diff=lfs merge=lfs -text
|
3293 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json filter=lfs diff=lfs merge=lfs -text
|
3294 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json filter=lfs diff=lfs merge=lfs -text
|
3295 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json filter=lfs diff=lfs merge=lfs -text
|
3296 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json filter=lfs diff=lfs merge=lfs -text
|
3297 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json filter=lfs diff=lfs merge=lfs -text
|
3298 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json filter=lfs diff=lfs merge=lfs -text
|
3299 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json filter=lfs diff=lfs merge=lfs -text
|
3300 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json filter=lfs diff=lfs merge=lfs -text
|
3301 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json filter=lfs diff=lfs merge=lfs -text
|
3302 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json filter=lfs diff=lfs merge=lfs -text
|
3303 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json filter=lfs diff=lfs merge=lfs -text
|
3304 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json filter=lfs diff=lfs merge=lfs -text
|
3305 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json filter=lfs diff=lfs merge=lfs -text
|
3306 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json filter=lfs diff=lfs merge=lfs -text
|
3307 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json filter=lfs diff=lfs merge=lfs -text
|
3308 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json filter=lfs diff=lfs merge=lfs -text
|
3309 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json filter=lfs diff=lfs merge=lfs -text
|
3310 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json filter=lfs diff=lfs merge=lfs -text
|
3311 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json filter=lfs diff=lfs merge=lfs -text
|
3312 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json filter=lfs diff=lfs merge=lfs -text
|
3313 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json filter=lfs diff=lfs merge=lfs -text
|
3314 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json filter=lfs diff=lfs merge=lfs -text
|
3315 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json filter=lfs diff=lfs merge=lfs -text
|
3316 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json filter=lfs diff=lfs merge=lfs -text
|
3317 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json filter=lfs diff=lfs merge=lfs -text
|
3318 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json filter=lfs diff=lfs merge=lfs -text
|
3319 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json filter=lfs diff=lfs merge=lfs -text
|
3320 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json filter=lfs diff=lfs merge=lfs -text
|
3321 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3322 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3323 |
+
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71aab43878483371d224f38eb1ad55e043081b724358eefccf37bc26e7620097
|
3 |
+
size 99448678
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fde0235a85cb5d96636b1cbb0d6beb554d74f176a3cdfeb1defaebd01623943
|
3 |
+
size 99890428
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0612814da3cb33d8d2eb1f75dc5f2a4909b0160d75bf383476f60398edf9ae32
|
3 |
+
size 99251520
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4920256b4ec6cb05c25db04578386b5f7a699bf0c137b5dd4441484a2c2fce0e
|
3 |
+
size 99661384
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87c76337cce812e69f02ef7754f4a5cc19a3142359e3bff8cf117b67292d09e6
|
3 |
+
size 98975210
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2a780b710d5b9d40280efeed5155b41cd87757696af0093a6eb44eca7ea3cf5
|
3 |
+
size 98879771
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e274f0f3c374d1bf25d447f4109ca13510d9995974dee12f43301f1a0117010
|
3 |
+
size 100320423
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59fe05b5f0f9394edea3033ce4d8e5c7d98c668171d3deba787a7d899fabbd4e
|
3 |
+
size 99637438
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:593905039fe3686fc38c69104be5dd1353c0000c4131a3ddbe83499a9fd92209
|
3 |
+
size 98963498
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d885b819415eed988f08b967b34d0bf31ee0b3212df3314da4fef62bed68d2dd
|
3 |
+
size 99552705
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db2b30e5acaf033a2ac797620bfd5f9b102e7721cd84628868d5732cf38a06a8
|
3 |
+
size 100399459
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bef6d6ca9c8b3e48b2abb39f419e57a097020985ea15b0268a7f35f04213aeb9
|
3 |
+
size 99359211
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de20bee3f8ba29f37c7ffdb065e91be3908a57fc45d48a619d8d0251d9b136b2
|
3 |
+
size 100380525
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cfe1458750b3002b6759cb892feec1fe91833ad9da3ffc14018cfec2bad127f
|
3 |
+
size 99455088
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f303bf6c91bb25400810fe192241c4166eff27dc356c642765f6195ff9b86c04
|
3 |
+
size 99193394
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22c21c5f634e8c88a7a70ccf5028524d44f6b9c9feb132df21c29e277f7e042a
|
3 |
+
size 99797117
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45ca6c3f7fe94f9338c296cf8cf297c25d874b1dcead16478df75c1b45fa8b54
|
3 |
+
size 99552349
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:339d17c86b8fea1357912d0f1f88ca53435ba97378c2e19b67ed2d4ff36d2cb3
|
3 |
+
size 100528029
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c2eec62fcbfdf38e78fc8b2fbdb84e4071b5c589ac245cc6a9225bdf1326ebc
|
3 |
+
size 99295263
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45564dde55aec0bfb9bbeacc20c70f342a45726b0a0bbe7160501ce510c9102c
|
3 |
+
size 99432712
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aa8454d9deabc22a3e1ddc935b9e4ffd6bb35349ed0e5895596cc2c1de126dc
|
3 |
+
size 99312364
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ec477035b1632e11144c0bc4c6dc9617ada4b7e33f3ef675f1b2024fb727238
|
3 |
+
size 98866949
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0aaffa8968627bf6a0eb4eadffc79750b99dde4ceeef18f8094401af3ff4db47
|
3 |
+
size 99334666
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d84e00403ec87284f5ef3f59d6ecccb432c8b6dcd9dad5bbe2765dd2d4ec2e2c
|
3 |
+
size 99617719
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95bf2456a0692c67acf16ab0c3fa25b0fddea75aebbf80df4a9da0a10e0ec49d
|
3 |
+
size 99498575
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77cf0a4100a0631d947de0ab40ab15dce9e518a6f7863702ea90e86570f5b265
|
3 |
+
size 100086828
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f54f05b1ff548158f001161937d22b6a39e817fedfb78573cc4aae130820928
|
3 |
+
size 99256207
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:852988366b719bbfbb3c0ebcc309fae11dd1ae636187c9e25eda829632fd63d4
|
3 |
+
size 99846515
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f915973875408899ec8dd0375d8a0510449a5b0795a6b689dab875e3055e917
|
3 |
+
size 99754017
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee39d42a3be447e74bafe2dfee5208bca9323a4e1e8b8253632a5e0db7956429
|
3 |
+
size 99783904
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e44cd9c89760ea8fb00b1dd28b64e9c1c0525dec608cc09bc750c3567bb3dfe
|
3 |
+
size 100261923
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85458d15aa6dea598a65a7cc1c88406d2a8cb7c8dca30775de4c329279419943
|
3 |
+
size 99481021
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"sae_set": "llama_scope_r1_distill",
|
3 |
+
"sae_path": "31-llamascope-openr1-res-32k",
|
4 |
+
"outputs_dir": "31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768",
|
5 |
+
"np_sae_id_suffix": null,
|
6 |
+
"np_set_name": null,
|
7 |
+
"from_local_sae": false,
|
8 |
+
"sparsity_threshold": -6,
|
9 |
+
"huggingface_dataset_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/data/OpenR1-Math-220k",
|
10 |
+
"n_prompts_total": 24576,
|
11 |
+
"n_tokens_in_prompt": 128,
|
12 |
+
"n_prompts_in_forward_pass": 256,
|
13 |
+
"n_features_at_a_time": 1024,
|
14 |
+
"quantile_feature_batch_size": 64,
|
15 |
+
"start_batch": 0,
|
16 |
+
"end_batch": null,
|
17 |
+
"n_quantiles": 5,
|
18 |
+
"top_acts_group_size": 30,
|
19 |
+
"quantile_group_size": 5,
|
20 |
+
"use_dfa": false,
|
21 |
+
"model_dtype": "bfloat16",
|
22 |
+
"sae_dtype": "bfloat16",
|
23 |
+
"model_id": "meta-llama/Llama-3.1-8B",
|
24 |
+
"layer": 31,
|
25 |
+
"sae_device": "cuda",
|
26 |
+
"activation_store_device": "cuda",
|
27 |
+
"model_device": "cuda",
|
28 |
+
"model_n_devices": 1,
|
29 |
+
"use_wandb": false,
|
30 |
+
"shuffle_tokens": true,
|
31 |
+
"prefix_tokens": null,
|
32 |
+
"suffix_tokens": null,
|
33 |
+
"ignore_positions": null,
|
34 |
+
"hf_model_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/models/DeepSeek-R1-Distill-Llama-8B"
|
35 |
+
}
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"model_id": "meta-llama/Llama-3.1-8B", "layer": "31", "sae_set": "llama_scope_r1_distill", "log_sparsity": -6, "skipped_indexes": []}
|
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6432be59b474d4752bbab38fa295adf642a4cb737ad2aea8fd972a5eaaa3182e
|
3 |
+
size 25167029
|