michaelfeil committed on
Commit
3d7749e
1 Parent(s): 6614ed4

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -1
README.md CHANGED
@@ -1,5 +1,7 @@
1
  ---
2
  license: apache-2.0
 
 
3
  ---
4
  # Fast-Inference with Ctranslate2
5
  Speedup inference by 2x-8x using int8 inference in C++
@@ -18,7 +20,7 @@ Checkpoint compatible to [ctranslate2](https://github.com/OpenNMT/CTranslate2) a
18
  from hf_hub_ctranslate2 import TranslatorCT2fromHfHub, GeneratorCT2fromHfHub
19
 
20
  model_name = "michaelfeil/ct2fast-flan-alpaca-base"
21
- model = GeneratorCT2fromHfHub(
22
  # load in int8 on CUDA
23
  model_name_or_path=model_name,
24
  device="cuda",
 
1
  ---
2
  license: apache-2.0
3
+ tags:
4
+ - ctranslate2
5
  ---
6
  # Fast-Inference with Ctranslate2
7
  Speedup inference by 2x-8x using int8 inference in C++
 
20
  from hf_hub_ctranslate2 import TranslatorCT2fromHfHub, GeneratorCT2fromHfHub
21
 
22
  model_name = "michaelfeil/ct2fast-flan-alpaca-base"
23
+ model = TranslatorCT2fromHfHub(
24
  # load in int8 on CUDA
25
  model_name_or_path=model_name,
26
  device="cuda",