michaelfeil
committed on
Commit
•
7df365d
1
Parent(s):
1881f31
Update README.md
Browse files
README.md
CHANGED
@@ -24,7 +24,7 @@ model = TranslatorCT2fromHfHub(
|
|
24 |
# load in int8 on CUDA
|
25 |
model_name_or_path=model_name,
|
26 |
device="cuda",
|
27 |
-
compute_type="
|
28 |
)
|
29 |
outputs = model.generate(
|
30 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|
|
|
24 |
# load in int8 on CUDA
|
25 |
model_name_or_path=model_name,
|
26 |
device="cuda",
|
27 |
+
compute_type="int8_float16"
|
28 |
)
|
29 |
outputs = model.generate(
|
30 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|