michaelfeil
committed on
Commit
•
b795d29
1
Parent(s):
33005d6
Upload sentence-transformers/all-MiniLM-L6-v2 ctranslate fp16 weights
Browse files
README.md
CHANGED
@@ -60,12 +60,11 @@ model = EncoderCT2fromHfHub(
|
|
60 |
# load in int8 on CUDA
|
61 |
model_name_or_path=model_name,
|
62 |
device="cuda",
|
63 |
-
compute_type="
|
64 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
65 |
)
|
66 |
outputs = model.generate(
|
67 |
-
text=["
|
68 |
-
max_length=64,
|
69 |
)
|
70 |
print(outputs.shape, outputs)
|
71 |
```
|
|
|
60 |
# load in float16 on CUDA
|
61 |
model_name_or_path=model_name,
|
62 |
device="cuda",
|
63 |
+
compute_type="float16",
|
64 |
# tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
|
65 |
)
|
66 |
outputs = model.generate(
|
67 |
+
text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
|
|
|
68 |
)
|
69 |
print(outputs.shape, outputs)
|
70 |
```
|