Zack Li
committed on
Commit
•
1f09c6d
1
Parent(s):
7f2687d
Update README.md
Browse files
README.md
CHANGED
@@ -64,7 +64,7 @@ def inference(input_text):
|
|
64 |
end_time = time.time()
|
65 |
return {"output": res, "latency": end_time - start_time}
|
66 |
|
67 |
-
model_id = "NexaAIDev/
|
68 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
69 |
model = GemmaForCausalLM.from_pretrained(
|
70 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|
|
|
64 |
end_time = time.time()
|
65 |
return {"output": res, "latency": end_time - start_time}
|
66 |
|
67 |
+
model_id = "NexaAIDev/Octopus-v2"
|
68 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
69 |
model = GemmaForCausalLM.from_pretrained(
|
70 |
model_id, torch_dtype=torch.bfloat16, device_map="auto"
|