Update README.md
Browse files
README.md
CHANGED
|
@@ -165,7 +165,7 @@ lm_eval --model hf --model_args pretrained=$MODEL --tasks mmlu --device cuda:0 -
|
|
| 165 |
| Memory (tested on H100) | | |
|
| 166 |
|----------------------------------|----------------|-------------------------------|
|
| 167 |
| | Qwen3-32B | Qwen3-32B-float8dq |
|
| 168 |
-
| Peak Memory | 65.72 GB | 34.54 GB (
|
| 169 |
|
| 170 |
<details>
|
| 171 |
<summary> Reproduce Peak Memory Usage Results </summary>
|
|
|
|
| 165 |
| Memory (tested on H100) | | |
|
| 166 |
|----------------------------------|----------------|-------------------------------|
|
| 167 |
| | Qwen3-32B | Qwen3-32B-float8dq |
|
| 168 |
+
| Peak Memory | 65.72 GB | 34.54 GB (47.44% reduction) |
|
| 169 |
|
| 170 |
<details>
|
| 171 |
<summary> Reproduce Peak Memory Usage Results </summary>
|