Upload folder using huggingface_hub
Browse files- .gitattributes +32 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json +3 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json +35 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json +1 -0
- llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt +3 -0
.gitattributes
CHANGED
@@ -3353,3 +3353,35 @@ llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_l
|
|
3353 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3354 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3355 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3353 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3354 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3355 |
llamascope-slimpj-res-32k/31-llamascope-slimpj-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
3356 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json filter=lfs diff=lfs merge=lfs -text
|
3357 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json filter=lfs diff=lfs merge=lfs -text
|
3358 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json filter=lfs diff=lfs merge=lfs -text
|
3359 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json filter=lfs diff=lfs merge=lfs -text
|
3360 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json filter=lfs diff=lfs merge=lfs -text
|
3361 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json filter=lfs diff=lfs merge=lfs -text
|
3362 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json filter=lfs diff=lfs merge=lfs -text
|
3363 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json filter=lfs diff=lfs merge=lfs -text
|
3364 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json filter=lfs diff=lfs merge=lfs -text
|
3365 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json filter=lfs diff=lfs merge=lfs -text
|
3366 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json filter=lfs diff=lfs merge=lfs -text
|
3367 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json filter=lfs diff=lfs merge=lfs -text
|
3368 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json filter=lfs diff=lfs merge=lfs -text
|
3369 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json filter=lfs diff=lfs merge=lfs -text
|
3370 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json filter=lfs diff=lfs merge=lfs -text
|
3371 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json filter=lfs diff=lfs merge=lfs -text
|
3372 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json filter=lfs diff=lfs merge=lfs -text
|
3373 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json filter=lfs diff=lfs merge=lfs -text
|
3374 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json filter=lfs diff=lfs merge=lfs -text
|
3375 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json filter=lfs diff=lfs merge=lfs -text
|
3376 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json filter=lfs diff=lfs merge=lfs -text
|
3377 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json filter=lfs diff=lfs merge=lfs -text
|
3378 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json filter=lfs diff=lfs merge=lfs -text
|
3379 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json filter=lfs diff=lfs merge=lfs -text
|
3380 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json filter=lfs diff=lfs merge=lfs -text
|
3381 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json filter=lfs diff=lfs merge=lfs -text
|
3382 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json filter=lfs diff=lfs merge=lfs -text
|
3383 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json filter=lfs diff=lfs merge=lfs -text
|
3384 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json filter=lfs diff=lfs merge=lfs -text
|
3385 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json filter=lfs diff=lfs merge=lfs -text
|
3386 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json filter=lfs diff=lfs merge=lfs -text
|
3387 |
+
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json filter=lfs diff=lfs merge=lfs -text
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-0.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a218cc95fe2aa70626c984239f18858952f9df8089adaad8861d1dc34c5dd772
|
3 |
+
size 104189323
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-1.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4ac5236e6418f262a1502a136afacb07e2bf85d3201d775385a813ea39da291
|
3 |
+
size 104539127
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-10.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48fed52f711ff39330753606e9b17ad0d8d2557abc6348030649190d08be5fe3
|
3 |
+
size 104185701
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-11.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:487bfd6fde1fcf946ced135efddcb6b1881712006b012cafa50a5015c878ce0f
|
3 |
+
size 104335771
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-12.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c28e670a3b734f5d2d7a195baab3a2efe96bc916e59facb880609e66137081be
|
3 |
+
size 104181042
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-13.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c69c335e7c19380b6ba7cf362917d70f41a6d57c374a2de5255f227d755b5dd2
|
3 |
+
size 104915190
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-14.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:694d45f3d90b7be0a109b8661d626fa0d50cb78e6626d55a7c47f40dbb41c519
|
3 |
+
size 104434686
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-15.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90c3ea6b56da1b2981a454ce2fdb5486f1177c44be9d1fc4ae91e8568ced4098
|
3 |
+
size 104223069
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-16.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f966dd48d4a7edcf844ee7421819bd45e7df436a3c705ce006e7272dd5aed6d1
|
3 |
+
size 104648090
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-17.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:446a22e73d4ac9dd9b71cffda6a2f9a5d75ecbbaf664bb5d95b1a60d3b6c010c
|
3 |
+
size 104011986
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-18.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93b41d8c6a1059e77cd3b5532dfd61e27d966d9c0f18ef92d9949166ae8fbfa5
|
3 |
+
size 103570302
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-19.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bd3e03975735bf66ebdf1fb0d7db8dc46eb5a6820edd48d7e34610068042ccd
|
3 |
+
size 103872923
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-2.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0fb1bbf83b8b807b323171bd91c624059815f44793a28abc04775e5234771e4
|
3 |
+
size 104359285
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-20.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53932f279b4816dee26bdebd54ef80dff5b300ab27dcad66b0779ac3a6dda2af
|
3 |
+
size 104060246
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-21.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:452170019cc433563e256620036a23f77705077e91afd89a94ad816e039cf043
|
3 |
+
size 104551717
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-22.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb15c44935fc381a30e9c0817e3a062554b42a79d097dd4fcbed15c7d2498b79
|
3 |
+
size 104678061
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-23.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9278da800370e90d1944919d492f454c4b11f01216c2931d486e488f68713034
|
3 |
+
size 104252218
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-24.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d71e009bfd92ffbe9c27c09c91dd80e36b2dd9313834fe103a59a168f7f967f
|
3 |
+
size 104001906
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-25.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eb1dc5e46ef1c640d4d59739d73f411d4b2ad2eacc9b1a6e75dd7f2868cef8e
|
3 |
+
size 104436279
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-26.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38f5d2d807ce877230ed9cb8f8b8a3220db1cedcb4325b10ea5db41fc3a9a277
|
3 |
+
size 104342619
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-27.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10d0678d36c6e7bf32a966f0cc89dc2f92a9a3d304beb140d520d549c9428189
|
3 |
+
size 103996435
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-28.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41391f72a9ed349d01623f2a4ef1bea71099e6600a78aa770139ad28eb31dafc
|
3 |
+
size 104302130
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-29.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f061af15537ec2eeee73b05bcf97967aefdfac2a99946303afc329552f7fcab
|
3 |
+
size 104047309
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-3.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ff39a83db1ebabae89d55ad749a658e12dd1d19962a728afc84b3252be20558
|
3 |
+
size 104503621
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-30.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96dc8a991d7c6dbcc752b622ee8738f62d1c55e61e22eec40e55333f6ac277b3
|
3 |
+
size 104225723
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-31.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82fbdcd5427c551b5d1f9d01894c83faab1c14e69739d8600cbe4e286619c0eb
|
3 |
+
size 104076935
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-4.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20a71bf8adbc26431d5181ce91f0b8532805e27de51543f551d1b18bd38be316
|
3 |
+
size 104211831
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-5.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7505a7fcef72f731a652854eab581c33e0ff1dc2816c672f38f48649cf5de4d8
|
3 |
+
size 104188935
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-6.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f0b82db1691a3ff709c3abc6eec632fdaa18616ea993d8765aab9fae5d18821
|
3 |
+
size 104185277
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-7.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41378b35b4860e41a9609b74b80aef291243a491ef39290ff841ea51350382f7
|
3 |
+
size 103752859
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-8.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eebfb105c4e5e834f5ddfe2542adc39d0f50ad9b0fc9e3d8a6f6a91c8d894e35
|
3 |
+
size 104457432
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/batch-9.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36e93d375616c4aa6751e52f6bce7bdb1130ea786b1e8616c893f41b04da239e
|
3 |
+
size 103887507
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/run_settings.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"sae_set": "llama_scope_r1_distill",
|
3 |
+
"sae_path": "31-llamascope-slimpj-openr1-res-32k",
|
4 |
+
"outputs_dir": "31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768",
|
5 |
+
"np_sae_id_suffix": null,
|
6 |
+
"np_set_name": null,
|
7 |
+
"from_local_sae": false,
|
8 |
+
"sparsity_threshold": -6,
|
9 |
+
"huggingface_dataset_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/data/merge_for_saedashboard",
|
10 |
+
"n_prompts_total": 24576,
|
11 |
+
"n_tokens_in_prompt": 128,
|
12 |
+
"n_prompts_in_forward_pass": 256,
|
13 |
+
"n_features_at_a_time": 1024,
|
14 |
+
"quantile_feature_batch_size": 64,
|
15 |
+
"start_batch": 0,
|
16 |
+
"end_batch": null,
|
17 |
+
"n_quantiles": 5,
|
18 |
+
"top_acts_group_size": 30,
|
19 |
+
"quantile_group_size": 5,
|
20 |
+
"use_dfa": false,
|
21 |
+
"model_dtype": "bfloat16",
|
22 |
+
"sae_dtype": "bfloat16",
|
23 |
+
"model_id": "meta-llama/Llama-3.1-8B",
|
24 |
+
"layer": 31,
|
25 |
+
"sae_device": "cuda",
|
26 |
+
"activation_store_device": "cuda",
|
27 |
+
"model_device": "cuda",
|
28 |
+
"model_n_devices": 1,
|
29 |
+
"use_wandb": false,
|
30 |
+
"shuffle_tokens": true,
|
31 |
+
"prefix_tokens": null,
|
32 |
+
"suffix_tokens": null,
|
33 |
+
"ignore_positions": null,
|
34 |
+
"hf_model_path": "/inspire/hdd/ws-8207e9e2-e733-4eec-a475-cfa1c36480ba/embodied-multimodality/public/zfhe/models/DeepSeek-R1-Distill-Llama-8B"
|
35 |
+
}
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/skipped_indexes.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"model_id": "meta-llama/Llama-3.1-8B", "layer": "31", "sae_set": "llama_scope_r1_distill", "log_sparsity": -6, "skipped_indexes": []}
|
llamascope-slimpj-openr1-res-32k/31-llamascope-slimpj-openr1-res-32k/meta-llama/Llama-3.1-8B_llama_scope_r1_distill_blocks.31.hook_resid_post_32768/tokens_24576.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9f1ea268277883c510b90ceb5e0fe8b7f52d48cd9097a3621ccb7d0cf58aa57
|
3 |
+
size 25167029
|