Update README.md
Browse files
README.md
CHANGED
@@ -38,7 +38,7 @@ python3 quantize_quark.py \
|
|
38 |
--output_dir deepseek-moe-16b-chat-FP8-KV \
|
39 |
--quant_scheme w_fp8_a_fp8 \
|
40 |
--kv_cache_dtype fp8 \
|
41 |
-
|
42 |
--model_export quark_safetensors \
|
43 |
--no_weight_matrix_merge \
|
44 |
--multi_gpu
|
|
|
38 |
--output_dir deepseek-moe-16b-chat-FP8-KV \
|
39 |
--quant_scheme w_fp8_a_fp8 \
|
40 |
--kv_cache_dtype fp8 \
|
41 |
+
--num_calib_data 128 \
|
42 |
--model_export quark_safetensors \
|
43 |
--no_weight_matrix_merge \
|
44 |
--multi_gpu
|