SiliconThaumaturgy committed on
Commit
627809c
·
verified ·
1 Parent(s): efee023

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -34,4 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  assets/intro_2.jpg filter=lfs diff=lfs merge=lfs -text
37
- Marco-o1-rk3588-w8a8-opt-1-hybrid-ratio-0.0.rkllm filter=lfs diff=lfs merge=lfs -text
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  assets/intro_2.jpg filter=lfs diff=lfs merge=lfs -text
37
+ Marco-o1-rk3588-w8a8_g512-opt-1-hybrid-ratio-0.0.rkllm filter=lfs diff=lfs merge=lfs -text
Marco-o1-rk3588-w8a8_g512-opt-1-hybrid-ratio-0.0.rkllm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2830fd52bda7c776b9612d50f76163cf695377f1cfb3e7ef148102a9faa8c2e6
3
+ size 8306798924
README.md CHANGED
@@ -5,7 +5,7 @@ inference: false
5
  ---
6
  # Marco-o1-RK3588-1.1.2
7
 
8
- This version of Marco-o1 has been converted to run on the RK3588 NPU using w8a8 quantization.
9
 
10
  This model has been optimized with the following LoRA:
11
 
 
5
  ---
6
  # Marco-o1-RK3588-1.1.2
7
 
8
+ This version of Marco-o1 has been converted to run on the RK3588 NPU using w8a8_g512 quantization.
9
 
10
  This model has been optimized with the following LoRA:
11