JRosenkranz committed on
Commit
ab784c3
·
verified ·
1 Parent(s): f392e11

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -0
README.md CHANGED
@@ -144,6 +144,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
144
  --tokenizer=$MODEL_PATH \
145
  --speculator_path=ibm-fms/codellama-13b-accelerator \
146
  --speculator_source=hf \
 
147
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
148
  --prompt_type=code \
149
  --compile \
@@ -161,6 +162,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
161
  --tokenizer=$MODEL_PATH \
162
  --speculator_path=ibm-fms/codellama-13b-accelerator \
163
  --speculator_source=hf \
 
164
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
165
  --prompt_type=code \
166
  --compile \
@@ -177,6 +179,7 @@ python fms-extras/scripts/paged_speculative_inference.py \
177
  --tokenizer=$MODEL_PATH \
178
  --speculator_path=ibm-fms/codellama-13b-accelerator \
179
  --speculator_source=hf \
 
180
  --batch_input \
181
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
182
  --prompt_type=code \
 
144
  --tokenizer=$MODEL_PATH \
145
  --speculator_path=ibm-fms/codellama-13b-accelerator \
146
  --speculator_source=hf \
147
+ --speculator_variant=2b \
148
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
149
  --prompt_type=code \
150
  --compile \
 
162
  --tokenizer=$MODEL_PATH \
163
  --speculator_path=ibm-fms/codellama-13b-accelerator \
164
  --speculator_source=hf \
165
+ --speculator_variant=2b \
166
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
167
  --prompt_type=code \
168
  --compile \
 
179
  --tokenizer=$MODEL_PATH \
180
  --speculator_path=ibm-fms/codellama-13b-accelerator \
181
  --speculator_source=hf \
182
+ --speculator_variant=2b \
183
  --batch_input \
184
  --top_k_tokens_per_head=4,3,2,2,2,2,2 \
185
  --prompt_type=code \