Commit
·
9e910dc
1
Parent(s):
d1c73ed
Upload intfloat/e5-large-v2 ctranslate fp16 weights
Browse files
README.md
CHANGED
|
@@ -2630,12 +2630,11 @@ model = EncoderCT2fromHfHub(
|
|
| 2630 |
# load in int8 on CUDA
|
| 2631 |
model_name_or_path=model_name,
|
| 2632 |
device="cuda",
|
| 2633 |
-
compute_type="
|
| 2634 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
| 2635 |
)
|
| 2636 |
outputs = model.generate(
|
| 2637 |
-
text=["
|
| 2638 |
-
max_length=64,
|
| 2639 |
)
|
| 2640 |
print(outputs.shape, outputs)
|
| 2641 |
```
|
|
|
|
| 2630 |
# load in float16 on CUDA
|
| 2631 |
model_name_or_path=model_name,
|
| 2632 |
device="cuda",
|
| 2633 |
+
compute_type="float16",
|
| 2634 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
| 2635 |
)
|
| 2636 |
outputs = model.generate(
|
| 2637 |
+
text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
|
|
|
|
| 2638 |
)
|
| 2639 |
print(outputs.shape, outputs)
|
| 2640 |
```
|