michaelfeil
committed on
Commit
·
262cea7
1
Parent(s):
1f7309c
Upload intfloat/e5-small-v2 ctranslate fp16 weights
Browse files
README.md
CHANGED
@@ -2626,20 +2626,7 @@ from transformers import AutoTokenizer
|
|
2626 |
|
2627 |
model_name = "michaelfeil/ct2fast-e5-small-v2"
|
2628 |
|
2629 |
-
|
2630 |
-
model = GeneratorCT2fromHfHub(
|
2631 |
-
# load in int8 on CUDA
|
2632 |
-
model_name_or_path=model_name,
|
2633 |
-
device="cuda",
|
2634 |
-
compute_type="int8_float16",
|
2635 |
-
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
2636 |
-
)
|
2637 |
-
outputs = model.generate(
|
2638 |
-
text=["def fibonnaci(", "User: How are you doing? Bot:"],
|
2639 |
-
max_length=64,
|
2640 |
-
include_prompt_in_result=False
|
2641 |
-
)
|
2642 |
-
print(outputs)
|
2643 |
```
|
2644 |
|
2645 |
# Licence and other remarks:
|
|
|
2626 |
|
2627 |
model_name = "michaelfeil/ct2fast-e5-small-v2"
|
2628 |
|
2629 |
+
encoder-only
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2630 |
```
|
2631 |
|
2632 |
# Licence and other remarks:
|