jordimas committed on
Commit
5f8ccac
1 Parent(s): de1acd7

Update 2024-08-30 model

Browse files
Files changed (5) hide show
  1. README.md +2 -2
  2. config.json +8 -1
  3. model.bin +2 -2
  4. model_description.txt +6 -6
  5. sp_m.model +2 -2
README.md CHANGED
@@ -50,8 +50,8 @@ print(tokenizer.detokenize(translated[0][0]['tokens']))
50
 
51
  | testset | BLEU |
52
  |---------------------------------------|-------|
53
- | test dataset (from train/dev/test) | 36.2 |
54
- | Flores200 dataset | 24.5 |
55
 
56
  ## Additional information
57
  * https://github.com/Softcatala/nmt-models
 
50
 
51
  | testset | BLEU |
52
  |---------------------------------------|-------|
53
+ | test dataset (from train/dev/test) | 38.3 |
54
+ | Flores200 dataset | 25.1 |
55
 
56
  ## Additional information
57
  * https://github.com/Softcatala/nmt-models
config.json CHANGED
@@ -1,2 +1,9 @@
1
  {
2
- }
 
 
 
 
 
 
 
 
1
  {
2
+ "add_source_bos": false,
3
+ "add_source_eos": false,
4
+ "bos_token": "<s>",
5
+ "decoder_start_token": "<s>",
6
+ "eos_token": "</s>",
7
+ "layer_norm_epsilon": null,
8
+ "unk_token": "<unk>"
9
+ }
model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc3f0990763e7f2e6f41896c9c3cfcc20f14c8a613be41f34c5b9cead48fa6eb
3
- size 70727761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2d178173374dfacc0f7ea160371f2f5ac612a481779d8e4d6fc5ef6f0c91e0b
3
+ size 70727741
model_description.txt CHANGED
@@ -1,9 +1,9 @@
1
  Model description: cat-ita
2
- Date: 2022-11-15
3
- TF version 2.10.0, OpenNMT version 2.29.1, CTranslate2 version 2.24.0
4
  Test data set
5
- BLEU|nrefs:1|case:mixed|eff:no|tok:13a|smooth:exp|version:2.1.0 = 36.2 64.1/42.4/30.7/22.7 (BP = 0.974 ratio = 0.975 hyp_len = 139207 ref_len = 142832)
6
- chrF2|nrefs:1|case:mixed|eff:yes|nc:6|nw:0|space:no|version:2.1.0 = 62.9
7
  Flores data set
8
- BLEU|nrefs:1|case:mixed|eff:no|tok:13a|smooth:exp|version:2.1.0 = 24.5 58.1/32.3/19.4/12.0 (BP = 0.952 ratio = 0.953 hyp_len = 26034 ref_len = 27306)
9
- chrF2|nrefs:1|case:mixed|eff:yes|nc:6|nw:0|space:no|version:2.1.0 = 54.6
 
1
  Model description: cat-ita
2
+ Date: 2024-08-30
3
+ TF version 2.10.0, OpenNMT version 2.29.1, CTranslate2 version 3.22.0
4
  Test data set
5
+ BLEU|nrefs:1|bs:1000|seed:12345|case:mixed|eff:no|tok:13a|smooth:exp|version:2.1.0 = 38.3 (μ = 38.3 ± 0.6) 66.0/44.9/33.0/24.7 (BP = 0.972 ratio = 0.972 hyp_len = 171543 ref_len = 176440)
6
+ chrF2|nrefs:1|bs:1000|seed:12345|case:mixed|eff:yes|nc:6|nw:0|space:no|version:2.1.0 = 64.2 (μ = 64.2 ± 0.5)
7
  Flores data set
8
+ BLEU|nrefs:1|bs:1000|seed:12345|case:mixed|eff:no|tok:13a|smooth:exp|version:2.1.0 = 25.1 (μ = 25.1 ± 0.9) 58.5/32.8/20.0/12.3 (BP = 0.957 ratio = 0.958 hyp_len = 26150 ref_len = 27306)
9
+ chrF2|nrefs:1|bs:1000|seed:12345|case:mixed|eff:yes|nc:6|nw:0|space:no|version:2.1.0 = 55.2 (μ = 55.2 ± 0.6)
sp_m.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17adbdc0d9f2593177a7274e1d928828fff2ebb17d488355b328d4e707a47d47
3
- size 1167983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ceeec9cb66dcd10292dfcf80c2dbedf25fe427722b84845a6b2a58032254da
3
+ size 1161765