Update README.md
Browse files
README.md
CHANGED
|
@@ -64,7 +64,7 @@ def inference(input_text):
|
|
| 64 |
end_time = time.time()
|
| 65 |
return {"output": res, "latency": end_time - start_time}
|
| 66 |
|
| 67 |
-
model_id = "NexaAIDev/
|
| 68 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 69 |
model = GemmaForCausalLM.from_pretrained(
|
| 70 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|
|
|
|
| 64 |
end_time = time.time()
|
| 65 |
return {"output": res, "latency": end_time - start_time}
|
| 66 |
|
| 67 |
+
model_id = "NexaAIDev/Octopus-v2"
|
| 68 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 69 |
model = GemmaForCausalLM.from_pretrained(
|
| 70 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|