Update README.md
Browse files
README.md
CHANGED
@@ -88,16 +88,16 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
88 |
model_stub, torch_dtype="auto", device_map="auto"
|
89 |
)
|
90 |
|
|
|
|
|
91 |
output_dir = f"./{model_name}-FP8-dynamic"
|
92 |
|
93 |
oneshot(
|
94 |
model=model,
|
95 |
recipe=recipe,
|
96 |
-
output_dir=output_dir,
|
97 |
-
tokenizer=AutoTokenizer.from_pretrained(model_stub),
|
98 |
)
|
99 |
|
100 |
-
model.save_pretrained(output_dir, save_compressed=True
|
101 |
tokenizer.save_pretrained(output_dir)
|
102 |
```
|
103 |
</details>
|
|
|
88 |
model_stub, torch_dtype="auto", device_map="auto"
|
89 |
)
|
90 |
|
91 |
+
tokenizer = AutoTokenizer.from_pretrained(model_stub)
|
92 |
+
|
93 |
output_dir = f"./{model_name}-FP8-dynamic"
|
94 |
|
95 |
oneshot(
|
96 |
model=model,
|
97 |
recipe=recipe,
|
|
|
|
|
98 |
)
|
99 |
|
100 |
+
model.save_pretrained(output_dir, save_compressed=True)
|
101 |
tokenizer.save_pretrained(output_dir)
|
102 |
```
|
103 |
</details>
|