bowenbaoamd committed on
Commit
3c59ff8
·
verified ·
1 Parent(s): df42951

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -38,7 +38,7 @@ python3 quantize_quark.py \
38
         --output_dir deepseek-moe-16b-chat-FP8-KV \
39
         --quant_scheme w_fp8_a_fp8 \
40
         --kv_cache_dtype fp8 \
41
-        --num_calib_data 128 \
42
         --model_export quark_safetensors \
43
  --no_weight_matrix_merge \
44
         --multi_gpu
 
38
         --output_dir deepseek-moe-16b-chat-FP8-KV \
39
         --quant_scheme w_fp8_a_fp8 \
40
         --kv_cache_dtype fp8 \
41
+ --num_calib_data 128 \
42
         --model_export quark_safetensors \
43
  --no_weight_matrix_merge \
44
         --multi_gpu