michaelfeil
committed on
Commit
·
9e910dc
1
Parent(s):
d1c73ed
Upload intfloat/e5-large-v2 ctranslate fp16 weights
Browse files
README.md
CHANGED
@@ -2630,12 +2630,11 @@ model = EncoderCT2fromHfHub(
|
|
2630 |
# load in int8 on CUDA
|
2631 |
model_name_or_path=model_name,
|
2632 |
device="cuda",
|
2633 |
-
compute_type="
|
2634 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
2635 |
)
|
2636 |
outputs = model.generate(
|
2637 |
-
text=["
|
2638 |
-
max_length=64,
|
2639 |
)
|
2640 |
print(outputs.shape, outputs)
|
2641 |
```
|
|
|
2630 |
# load in int8 on CUDA
|
2631 |
model_name_or_path=model_name,
|
2632 |
device="cuda",
|
2633 |
+
compute_type="float16",
|
2634 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
2635 |
)
|
2636 |
outputs = model.generate(
|
2637 |
+
text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
|
|
|
2638 |
)
|
2639 |
print(outputs.shape, outputs)
|
2640 |
```
|