Upload folder using huggingface_hub
Browse files- .gitattributes +32 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json +3 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json +35 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json +1 -0
- llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt +3 -0
.gitattributes
CHANGED
@@ -3321,3 +3321,35 @@ llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_l
|
|
3321 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3322 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3323 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3321 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3322 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3323 |
llamascope-openr1-res-32k/31-llamascope-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
3324 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json filter=lfs diff=lfs merge=lfs -text
|
3325 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json filter=lfs diff=lfs merge=lfs -text
|
3326 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json filter=lfs diff=lfs merge=lfs -text
|
3327 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json filter=lfs diff=lfs merge=lfs -text
|
3328 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json filter=lfs diff=lfs merge=lfs -text
|
3329 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json filter=lfs diff=lfs merge=lfs -text
|
3330 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json filter=lfs diff=lfs merge=lfs -text
|
3331 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json filter=lfs diff=lfs merge=lfs -text
|
3332 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json filter=lfs diff=lfs merge=lfs -text
|
3333 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json filter=lfs diff=lfs merge=lfs -text
|
3334 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json filter=lfs diff=lfs merge=lfs -text
|
3335 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json filter=lfs diff=lfs merge=lfs -text
|
3336 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json filter=lfs diff=lfs merge=lfs -text
|
3337 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json filter=lfs diff=lfs merge=lfs -text
|
3338 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json filter=lfs diff=lfs merge=lfs -text
|
3339 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json filter=lfs diff=lfs merge=lfs -text
|
3340 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json filter=lfs diff=lfs merge=lfs -text
|
3341 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json filter=lfs diff=lfs merge=lfs -text
|
3342 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json filter=lfs diff=lfs merge=lfs -text
|
3343 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json filter=lfs diff=lfs merge=lfs -text
|
3344 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json filter=lfs diff=lfs merge=lfs -text
|
3345 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json filter=lfs diff=lfs merge=lfs -text
|
3346 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json filter=lfs diff=lfs merge=lfs -text
|
3347 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json filter=lfs diff=lfs merge=lfs -text
|
3348 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json filter=lfs diff=lfs merge=lfs -text
|
3349 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json filter=lfs diff=lfs merge=lfs -text
|
3350 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json filter=lfs diff=lfs merge=lfs -text
|
3351 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json filter=lfs diff=lfs merge=lfs -text
|
3352 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json filter=lfs diff=lfs merge=lfs -text
|
3353 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3354 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3355 |
+
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95dda01c5c2bdcb049cc16a3fd93b4a329bbfb1cb7f7f64e1e87944b764f8abc
|
3 |
+
size 109578986
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2912a50592d886ce5770b4dccd31f9caf28927e8e3702e48fbad8c0ebc45b03
|
3 |
+
size 109472676
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd83ff6ef09d9994319d24ad5d80220e7e111d2c43ddb87d3d3bbf7be133e9e2
|
3 |
+
size 109196437
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ff769242e5c9e5c410d2cf38df41f5be194ca6076860b06df2dddcb02f82603
|
3 |
+
size 109929911
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3763af956c18c1a7eeb540909a205043f469cd25f9c712630f2fd1c47adf1d94
|
3 |
+
size 109958967
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bada986ca2edaa495f55d558052d8795660df79e6a8a505f71b44dad262a4144
|
3 |
+
size 109878420
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bbdc1f65c1462e92ac1aa999beffe4ca64d2567f3e06e06ff8c0103184710b6
|
3 |
+
size 109569059
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17cae00c55e18309041f63257dd0631e07051a878ab5eb30fff15046a952dfbf
|
3 |
+
size 110318988
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7513b8b438f693b4c9e7b004f106ad2205a5ee5234a9488bf7e2acb123acf159
|
3 |
+
size 109947891
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d9d256ad35b95070bb6da6dcc7f588b88b8ccd5ebcb32958fa880aa1830d350
|
3 |
+
size 109949777
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40d0287052a70a64c3e8310a12a8f7047932de00f6bd4ce29c5bea187c66b2bf
|
3 |
+
size 109688817
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:483fce9e1ef16cb574db758fef225b9cc8e5562fb3d7b8547b85b68be4c68e95
|
3 |
+
size 110020551
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b813610cea56dd15dda6145a93f75eeba84fbd582324551c21c3e2109d238c3
|
3 |
+
size 109292922
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2c84c8fa104d4d5027328cdcc6b07ea491070951c78f4de46b33a902d5b6ca5
|
3 |
+
size 110523648
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6efa16aa3edbb709648e693c0c555095bbad700497b214bab2ef2801a9b8435e
|
3 |
+
size 110101549
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90aa66a1b7f7000ba943a2d0b500cf198f93b0b8b5516ab99ddc99880ad68aca
|
3 |
+
size 109471012
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7057732e7d99100c340fbda6731b01bf6e17679f564cc154c99b4fcc5279ee9b
|
3 |
+
size 109230769
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c6e5e99164eb6cfc6f4c3817f3f125c9892727000d0901b0080ff8224bde1d8
|
3 |
+
size 109557491
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1be8dd2bd415a8188445833e4683d836e379db5ab161f6c284f1c6afad9d381
|
3 |
+
size 109464088
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d521f5870b82f2ceeb0ab6261c48371d9024da5253ecc9fd378bec9fbcb327a5
|
3 |
+
size 109816916
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:063148280098b55ba93af7da3592029b023766f539d51870a96cdb4247c27cc8
|
3 |
+
size 109876712
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1c6d44a920dab6929a37b6c16a4211af2605230ea2101905ce18f59d9976459
|
3 |
+
size 110029087
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77e38c29c95474834342501e9954a3c45ce180004d9e9adcc67011be4d2412d5
|
3 |
+
size 109382543
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbe9e0afd0d9c80974cb4dbecda5a32cad072aaf29437bbb29608cc6ccea32aa
|
3 |
+
size 109195880
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5460d7034458a82e825d4cf1fca7ffc5969b6d827aa49b4c75da046330a4c5d7
|
3 |
+
size 109215319
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:886d61730370367ac5801b111c753b4919664c6eda8cf5fa24855d8fca3485df
|
3 |
+
size 109756668
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b6c789cae6901b0d25add458e8dbd1a2866f4f1fd8af554833590a7c7daf86
|
3 |
+
size 109556262
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d51571a66f5c10626161b18199189ec5b9884df5f0f30300d4098245ec4cf2
|
3 |
+
size 109319125
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4746a35a45cdbeb835a9f65880109733554c866fb8da496ba9fce9dd3f3d0447
|
3 |
+
size 109228398
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9200382c1c8b115e2d9a3e44d4a9775da94670f79ff0901c6e30cbf6a0e5d08
|
3 |
+
size 109903166
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50fcd75daf5416ebe76fbed44096c5a50578542105c2e7d8968df0aa3b3cf7d8
|
3 |
+
size 109664966
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e04adca32bf30ad80d8b7eaf13e2d89aa1e7fc20e99c040fdaf93cdd04f5543
|
3 |
+
size 110493603
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"sae_set": "llama_scope_r1_distill",
|
3 |
+
"sae_path": "31-llamascope-slimpj-res-32k",
|
4 |
+
"outputs_dir": "31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768",
|
5 |
+
"np_sae_id_suffix": null,
|
6 |
+
"np_set_name": null,
|
7 |
+
"from_local_sae": false,
|
8 |
+
"sparsity_threshold": -6,
|
9 |
+
"huggingface_dataset_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/data/SlimPajama-3B",
|
10 |
+
"n_prompts_total": 24576,
|
11 |
+
"n_tokens_in_prompt": 128,
|
12 |
+
"n_prompts_in_forward_pass": 256,
|
13 |
+
"n_features_at_a_time": 1024,
|
14 |
+
"quantile_feature_batch_size": 64,
|
15 |
+
"start_batch": 0,
|
16 |
+
"end_batch": null,
|
17 |
+
"n_quantiles": 5,
|
18 |
+
"top_acts_group_size": 30,
|
19 |
+
"quantile_group_size": 5,
|
20 |
+
"use_dfa": false,
|
21 |
+
"model_dtype": "bfloat16",
|
22 |
+
"sae_dtype": "bfloat16",
|
23 |
+
"model_id": "meta-llama/Llama-3.1-8B",
|
24 |
+
"layer": 31,
|
25 |
+
"sae_device": "cuda",
|
26 |
+
"activation_store_device": "cuda",
|
27 |
+
"model_device": "cuda",
|
28 |
+
"model_n_devices": 1,
|
29 |
+
"use_wandb": false,
|
30 |
+
"shuffle_tokens": true,
|
31 |
+
"prefix_tokens": null,
|
32 |
+
"suffix_tokens": null,
|
33 |
+
"ignore_positions": null,
|
34 |
+
"hf_model_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/models/DeepSeek-R1-Distill-Llama-8B"
|
35 |
+
}
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"model_id": "meta-llama/Llama-3.1-8B", "layer": "31", "sae_set": "llama_scope_r1_distill", "log_sparsity": -6, "skipped_indexes": []}
|
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c9d02733edfd635a4339de90c8de218368f4e8e4343faba678d108baabac3dc
|
3 |
+
size 25167029
|