Update README.md
Browse files
README.md
CHANGED
@@ -144,6 +144,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
144 |
--tokenizer=$MODEL_PATH \
|
145 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
146 |
--speculator_source=hf \
|
|
|
147 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
148 |
--prompt_type=code \
|
149 |
--compile \
|
@@ -161,6 +162,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
161 |
--tokenizer=$MODEL_PATH \
|
162 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
163 |
--speculator_source=hf \
|
|
|
164 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
165 |
--prompt_type=code \
|
166 |
--compile \
|
@@ -177,6 +179,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
|
|
177 |
--tokenizer=$MODEL_PATH \
|
178 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
179 |
--speculator_source=hf \
|
|
|
180 |
--batch_input \
|
181 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
182 |
--prompt_type=code \
|
|
|
144 |
--tokenizer=$MODEL_PATH \
|
145 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
146 |
--speculator_source=hf \
|
147 |
+
--speculator_variant=2b \
|
148 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
149 |
--prompt_type=code \
|
150 |
--compile \
|
|
|
162 |
--tokenizer=$MODEL_PATH \
|
163 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
164 |
--speculator_source=hf \
|
165 |
+
--speculator_variant=2b \
|
166 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
167 |
--prompt_type=code \
|
168 |
--compile \
|
|
|
179 |
--tokenizer=$MODEL_PATH \
|
180 |
--speculator_path=ibm-fms/codellama-13b-accelerator \
|
181 |
--speculator_source=hf \
|
182 |
+
--speculator_variant=2b \
|
183 |
--batch_input \
|
184 |
--top_k_tokens_per_head=4,3,2,2,2,2,2 \
|
185 |
--prompt_type=code \
|