osanseviero
committed on
Commit
•
2c8b980
1
Parent(s):
140dfaa
Fix model ID
Browse files
README.md
CHANGED
@@ -58,7 +58,7 @@ def inference(input_text):
|
|
58 |
end_time = time.time()
|
59 |
return {"output": res, "latency": end_time - start_time}
|
60 |
|
61 |
-
model_id = "NexaAIDev/
|
62 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
63 |
model = GemmaForCausalLM.from_pretrained(
|
64 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|
|
|
58 |
end_time = time.time()
|
59 |
return {"output": res, "latency": end_time - start_time}
|
60 |
|
61 |
+
model_id = "NexaAIDev/Octopus-v2"
|
62 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
63 |
model = GemmaForCausalLM.from_pretrained(
|
64 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|