Commit ·
7df365d
1
Parent(s): 1881f31
Update README.md
Browse files
README.md
CHANGED
|
@@ -24,7 +24,7 @@ model = TranslatorCT2fromHfHub(
|
|
| 24 |
# load in int8 on CUDA
|
| 25 |
model_name_or_path=model_name,
|
| 26 |
device="cuda",
|
| 27 |
-
compute_type="
|
| 28 |
)
|
| 29 |
outputs = model.generate(
|
| 30 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|
|
|
|
| 24 |
# load in int8 on CUDA
|
| 25 |
model_name_or_path=model_name,
|
| 26 |
device="cuda",
|
| 27 |
+
compute_type="int8_float16"
|
| 28 |
)
|
| 29 |
outputs = model.generate(
|
| 30 |
text=["How do you call a fast Flan-ingo?", "Translate to german: How are you doing?"],
|