michaelfeil committed on
Commit
1ee3243
1 Parent(s): fcb3f9e

Upload sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2 ctranslate fp16 weights

Browse files
Files changed (2) hide show
  1. README.md +2 -3
  2. tokenizer.json +0 -0
README.md CHANGED
@@ -38,12 +38,11 @@ model = EncoderCT2fromHfHub(
38
  # load in int8 on CUDA
39
  model_name_or_path=model_name,
40
  device="cuda",
41
- compute_type="int8_float16",
42
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
43
  )
44
  outputs = model.generate(
45
- text=["def fibonnaci(", "User: How are you doing? Bot:"],
46
- max_length=64,
47
  )
48
  print(outputs.shape, outputs)
49
  ```
 
38
  # load in int8 on CUDA
39
  model_name_or_path=model_name,
40
  device="cuda",
41
+ compute_type="float16",
42
  # tokenizer=AutoTokenizer.from_pretrained("{ORG}/{NAME}")
43
  )
44
  outputs = model.generate(
45
+ text=["I like soccer", "I like tennis", "The eiffel tower is in Paris"],
 
46
  )
47
  print(outputs.shape, outputs)
48
  ```
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff