michaelfeil committed on
Commit
262cea7
·
1 Parent(s): 1f7309c

Upload intfloat/e5-small-v2 ctranslate fp16 weights

Browse files
Files changed (1) hide show
  1. README.md +1 -14
README.md CHANGED
@@ -2626,20 +2626,7 @@ from transformers import AutoTokenizer
2626
 
2627
  model_name = "michaelfeil/ct2fast-e5-small-v2"
2628
 
2629
- # use either TranslatorCT2fromHfHub or GeneratorCT2fromHfHub here, depending on model.
2630
- model = GeneratorCT2fromHfHub(
2631
- # load in int8 on CUDA
2632
- model_name_or_path=model_name,
2633
- device="cuda",
2634
- compute_type="int8_float16",
2635
- # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
2636
- )
2637
- outputs = model.generate(
2638
- text=["def fibonnaci(", "User: How are you doing? Bot:"],
2639
- max_length=64,
2640
- include_prompt_in_result=False
2641
- )
2642
- print(outputs)
2643
  ```
2644
 
2645
  # Licence and other remarks:
 
2626
 
2627
  model_name = "michaelfeil/ct2fast-e5-small-v2"
2628
 
2629
+ encoder-only
 
 
 
 
 
 
 
 
 
 
 
 
 
2630
  ```
2631
 
2632
  # Licence and other remarks: