michaelfeil commited on
Commit
55bcef1
1 Parent(s): 38a984d

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -1,34 +1,9 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
29
- *.tgz filter=lfs diff=lfs merge=lfs -text
30
- *.wasm filter=lfs diff=lfs merge=lfs -text
31
- *.xz filter=lfs diff=lfs merge=lfs -text
32
- *.zip filter=lfs diff=lfs merge=lfs -text
33
- *.zst filter=lfs diff=lfs merge=lfs -text
34
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
2
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
 
 
 
 
4
  *.h5 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  *.tflite filter=lfs diff=lfs merge=lfs -text
6
+ *.tar.gz filter=lfs diff=lfs merge=lfs -text
7
+ *.ot filter=lfs diff=lfs merge=lfs -text
8
+ *.onnx filter=lfs diff=lfs merge=lfs -text
9
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
 
 
README.md ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - ctranslate2
4
+ - translation
5
+ license: apache-2.0
6
+ ---
7
+ # Fast-Inference with CTranslate2
8
+ Speed up inference by 2x-8x using int8 inference in C++
9
+
10
+ Quantized version of [Helsinki-NLP/opus-mt-en-fr](https://huggingface.co/Helsinki-NLP/opus-mt-en-fr)
11
+ ```bash
12
+ pip install "hf-hub-ctranslate2>=1.0.0" "ctranslate2>=3.13.0"
13
+ ```
14
+ Converted using
15
+ ```
16
+ ct2-transformers-converter --model Helsinki-NLP/opus-mt-en-fr --output_dir /home/michael/tmp-ct2fast-opus-mt-en-fr --force --copy_files README.md generation_config.json tokenizer_config.json vocab.json source.spm .gitattributes target.spm --quantization float16
17
+ ```
18
+
19
+ Checkpoint compatible with [ctranslate2](https://github.com/OpenNMT/CTranslate2) and [hf-hub-ctranslate2](https://github.com/michaelfeil/hf-hub-ctranslate2)
20
+ - `compute_type=int8_float16` for `device="cuda"`
21
+ - `compute_type=int8` for `device="cpu"`
22
+
23
+ ```python
24
+ from hf_hub_ctranslate2 import TranslatorCT2fromHfHub, GeneratorCT2fromHfHub
25
+ from transformers import AutoTokenizer
26
+
27
+ model_name = "michaelfeil/ct2fast-opus-mt-en-fr"
28
+ # use either TranslatorCT2fromHfHub or GeneratorCT2fromHfHub here, depending on model.
29
+ model = TranslatorCT2fromHfHub(
30
+ # load in int8 on CUDA
31
+ model_name_or_path=model_name,
32
+ device="cuda",
33
+ compute_type="int8_float16",
34
+ tokenizer=AutoTokenizer.from_pretrained("Helsinki-NLP/opus-mt-en-fr")
35
+ )
36
+ outputs = model.generate(
37
+ text=["How do you call a fast Flan-ingo?", "User: How are you doing?"],
38
+ )
39
+ print(outputs)
40
+ ```
41
+
42
+ # Licence and other remarks:
43
+ This is just a quantized version. Licence conditions are intended to be identical to those of the original Hugging Face repo.
44
+
45
+ # Original description
46
+
47
+
48
+ ### opus-mt-en-fr
49
+
50
+ * source languages: en
51
+ * target languages: fr
52
+ * OPUS readme: [en-fr](https://github.com/Helsinki-NLP/OPUS-MT-train/blob/master/models/en-fr/README.md)
53
+
54
+ * dataset: opus
55
+ * model: transformer-align
56
+ * pre-processing: normalization + SentencePiece
57
+ * download original weights: [opus-2020-02-26.zip](https://object.pouta.csc.fi/OPUS-MT-models/en-fr/opus-2020-02-26.zip)
58
+ * test set translations: [opus-2020-02-26.test.txt](https://object.pouta.csc.fi/OPUS-MT-models/en-fr/opus-2020-02-26.test.txt)
59
+ * test set scores: [opus-2020-02-26.eval.txt](https://object.pouta.csc.fi/OPUS-MT-models/en-fr/opus-2020-02-26.eval.txt)
60
+
61
+ ## Benchmarks
62
+
63
+ | testset | BLEU | chr-F |
64
+ |-----------------------|-------|-------|
65
+ | newsdiscussdev2015-enfr.en.fr | 33.8 | 0.602 |
66
+ | newsdiscusstest2015-enfr.en.fr | 40.0 | 0.643 |
67
+ | newssyscomb2009.en.fr | 29.8 | 0.584 |
68
+ | news-test2008.en.fr | 27.5 | 0.554 |
69
+ | newstest2009.en.fr | 29.4 | 0.577 |
70
+ | newstest2010.en.fr | 32.7 | 0.596 |
71
+ | newstest2011.en.fr | 34.3 | 0.611 |
72
+ | newstest2012.en.fr | 31.8 | 0.592 |
73
+ | newstest2013.en.fr | 33.2 | 0.589 |
74
+ | Tatoeba.en.fr | 50.5 | 0.672 |
75
+
config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_source_bos": false,
3
+ "add_source_eos": false,
4
+ "bos_token": "<s>",
5
+ "decoder_start_token": "</s>",
6
+ "eos_token": "</s>",
7
+ "unk_token": "<unk>"
8
+ }
generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bad_words_ids": [
4
+ [
5
+ 59513
6
+ ]
7
+ ],
8
+ "bos_token_id": 0,
9
+ "decoder_start_token_id": 59513,
10
+ "eos_token_id": 0,
11
+ "forced_eos_token_id": 0,
12
+ "max_length": 512,
13
+ "num_beams": 4,
14
+ "pad_token_id": 59513,
15
+ "transformers_version": "4.27.0.dev0"
16
+ }
model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:636d926880a6e6e4b773403a5991b50d4dfdfabe49a230e148676a05e99f2bec
3
+ size 149872839
shared_vocabulary.txt ADDED
The diff for this file is too large to render. See raw diff
 
source.spm ADDED
Binary file (778 kB). View file
 
target.spm ADDED
Binary file (802 kB). View file
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"target_lang": "fr", "source_lang": "en"}
vocab.json ADDED
The diff for this file is too large to render. See raw diff