michaelfeil committed on
Commit
9e910dc
·
1 Parent(s): d1c73ed

Upload intfloat/e5-large-v2 ctranslate fp16 weights

Browse files
Files changed (1) hide show
  1. README.md +2 -3
README.md CHANGED
@@ -2630,12 +2630,11 @@ model = EncoderCT2fromHfHub(
2630
  # load in int8 on CUDA
2631
  model_name_or_path=model_name,
2632
  device="cuda",
2633
- compute_type="int8_float16",
2634
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
2635
  )
2636
  outputs = model.generate(
2637
- text=["def fibonnaci(", "User: How are you doing? Bot:"],
2638
- max_length=64,
2639
  )
2640
  print(outputs.shape, outputs)
2641
  ```
 
2630
  # load in float16 on CUDA
2631
  model_name_or_path=model_name,
2632
  device="cuda",
2633
+ compute_type="float16",
2634
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
2635
  )
2636
  outputs = model.generate(
2637
+ text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
 
2638
  )
2639
  print(outputs.shape, outputs)
2640
  ```