michaelfeil committed on
Commit
b795d29
1 Parent(s): 33005d6

Upload sentence-transformers/all-MiniLM-L6-v2 ctranslate fp16 weights

Browse files
Files changed (1) hide show
  1. README.md +2 -3
README.md CHANGED
@@ -60,12 +60,11 @@ model = EncoderCT2fromHfHub(
60
  # load in int8 on CUDA
61
  model_name_or_path=model_name,
62
  device="cuda",
63
- compute_type="int8_float16",
64
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
65
  )
66
  outputs = model.generate(
67
- text=["def fibonnaci(", "User: How are you doing? Bot:"],
68
- max_length=64,
69
  )
70
  print(outputs.shape, outputs)
71
  ```
 
60
  # load in int8 on CUDA
61
  model_name_or_path=model_name,
62
  device="cuda",
63
+ compute_type="float16",
64
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
65
  )
66
  outputs = model.generate(
67
+ text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
 
68
  )
69
  print(outputs.shape, outputs)
70
  ```