michaelfeil
committed on
Commit
·
891cbdf
1
Parent(s):
f8dfe8e
Update README.md
Browse files
README.md
CHANGED
@@ -25,7 +25,7 @@ model = TranslatorCT2fromHfHub(
|
|
25 |
# load in int8 on CUDA
|
26 |
model_name_or_path=model_name,
|
27 |
device="cuda",
|
28 |
-
compute_type="
|
29 |
)
|
30 |
outputs = model.generate(
|
31 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|
|
|
25 |
# load in int8 on CUDA
|
26 |
model_name_or_path=model_name,
|
27 |
device="cuda",
|
28 |
+
compute_type="int8_float16"
|
29 |
)
|
30 |
outputs = model.generate(
|
31 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|