Update README.md
Browse files
README.md
CHANGED
@@ -36,7 +36,7 @@ python3 quantize_quark.py --model_dir "meta-llama/Llama-3.1-405B-Instruct" \
|
|
36 |
--quant_algo autosmoothquant \
|
37 |
--min_kv_scale 1.0 \
|
38 |
--model_export hf_format \
|
39 |
-
--output_dir
|
40 |
--multi_gpu
|
41 |
```
|
42 |
|
|
|
36 |
--quant_algo autosmoothquant \
|
37 |
--min_kv_scale 1.0 \
|
38 |
--model_export hf_format \
|
39 |
+
--output_dir amd/Llama-3.1-405B-Instruct-MXFP4 \
|
40 |
--multi_gpu
|
41 |
```
|
42 |
|