Initial commit
Browse files- .gitattributes +1 -0
- README.md +0 -0
- benchmark_results.txt +313 -0
- benchmark_translations.zip +0 -0
- config.json +41 -0
- generation_config.json +16 -0
- model.safetensors +3 -0
- pytorch_model.bin +3 -0
- source.spm +3 -0
- special_tokens_map.json +1 -0
- target.spm +3 -0
- tokenizer_config.json +1 -0
- vocab.json +0 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
*.spm filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
The diff for this file is too large to render.
See raw diff
|
|
benchmark_results.txt
ADDED
@@ -0,0 +1,313 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
multi-multi tatoeba-test-v2020-07-28-v2023-09-26 0.69536 52.8 10000 84956
|
2 |
+
ast-deu flores101-devtest 0.53243 24.2 1012 25094
|
3 |
+
ast-eng flores101-devtest 0.61235 36.0 1012 24721
|
4 |
+
ast-fra flores101-devtest 0.56687 31.2 1012 28343
|
5 |
+
ast-por flores101-devtest 0.57033 30.6 1012 26519
|
6 |
+
ast-spa flores101-devtest 0.49637 21.2 1012 29199
|
7 |
+
cat-fra flores101-devtest 0.63271 38.4 1012 28343
|
8 |
+
fra-deu flores101-devtest 0.58433 28.9 1012 25094
|
9 |
+
fra-eng flores101-devtest 0.67826 43.3 1012 24721
|
10 |
+
glg-deu flores101-devtest 0.56897 27.1 1012 25094
|
11 |
+
glg-spa flores101-devtest 0.53183 24.2 1012 29199
|
12 |
+
ita-por flores101-devtest 0.57961 28.4 1012 26519
|
13 |
+
kea-deu flores101-devtest 0.48105 18.3 1012 25094
|
14 |
+
kea-eng flores101-devtest 0.60362 35.0 1012 24721
|
15 |
+
kea-por flores101-devtest 0.57808 29.0 1012 26519
|
16 |
+
kea-spa flores101-devtest 0.46648 17.6 1012 29199
|
17 |
+
oci-deu flores101-devtest 0.57391 28.0 1012 25094
|
18 |
+
oci-eng flores101-devtest 0.72351 49.4 1012 24721
|
19 |
+
por-eng flores101-devtest 0.70724 47.4 1012 24721
|
20 |
+
por-fra flores101-devtest 0.64103 39.2 1012 28343
|
21 |
+
por-spa flores101-devtest 0.53268 25.0 1012 29199
|
22 |
+
ron-deu flores101-devtest 0.57980 28.1 1012 25094
|
23 |
+
ron-eng flores101-devtest 0.67583 41.6 1012 24721
|
24 |
+
ron-spa flores101-devtest 0.53082 24.3 1012 29199
|
25 |
+
spa-fra flores101-devtest 0.57039 27.1 1012 28343
|
26 |
+
spa-por flores101-devtest 0.55607 25.0 1012 26519
|
27 |
+
ast-deu flores200-devtest 0.53776 24.8 1012 25094
|
28 |
+
ast-eng flores200-devtest 0.61482 36.8 1012 24721
|
29 |
+
ast-fra flores200-devtest 0.56504 31.3 1012 28343
|
30 |
+
ast-por flores200-devtest 0.57158 31.1 1012 26519
|
31 |
+
ast-spa flores200-devtest 0.49579 21.2 1012 29199
|
32 |
+
cat-deu flores200-devtest 0.58203 29.2 1012 25094
|
33 |
+
cat-eng flores200-devtest 0.69165 44.6 1012 24721
|
34 |
+
cat-fra flores200-devtest 0.63612 38.9 1012 28343
|
35 |
+
cat-por flores200-devtest 0.62911 37.7 1012 26519
|
36 |
+
cat-spa flores200-devtest 0.53320 24.6 1012 29199
|
37 |
+
fra-deu flores200-devtest 0.58592 29.1 1012 25094
|
38 |
+
fra-eng flores200-devtest 0.68067 43.8 1012 24721
|
39 |
+
fra-por flores200-devtest 0.62388 37.0 1012 26519
|
40 |
+
fra-spa flores200-devtest 0.52983 24.4 1012 29199
|
41 |
+
fur-deu flores200-devtest 0.51969 21.8 1012 25094
|
42 |
+
fur-eng flores200-devtest 0.60793 34.3 1012 24721
|
43 |
+
fur-fra flores200-devtest 0.56989 30.0 1012 28343
|
44 |
+
fur-por flores200-devtest 0.56207 29.3 1012 26519
|
45 |
+
fur-spa flores200-devtest 0.48436 20.0 1012 29199
|
46 |
+
glg-deu flores200-devtest 0.57369 27.7 1012 25094
|
47 |
+
glg-eng flores200-devtest 0.66358 40.0 1012 24721
|
48 |
+
glg-fra flores200-devtest 0.62487 36.5 1012 28343
|
49 |
+
glg-por flores200-devtest 0.60267 32.7 1012 26519
|
50 |
+
glg-spa flores200-devtest 0.53227 24.3 1012 29199
|
51 |
+
hat-deu flores200-devtest 0.49916 19.1 1012 25094
|
52 |
+
hat-eng flores200-devtest 0.59656 32.5 1012 24721
|
53 |
+
hat-fra flores200-devtest 0.61574 35.4 1012 28343
|
54 |
+
hat-por flores200-devtest 0.55195 27.7 1012 26519
|
55 |
+
hat-spa flores200-devtest 0.47382 18.4 1012 29199
|
56 |
+
ita-deu flores200-devtest 0.55779 24.1 1012 25094
|
57 |
+
ita-eng flores200-devtest 0.61563 32.2 1012 24721
|
58 |
+
ita-fra flores200-devtest 0.60210 31.2 1012 28343
|
59 |
+
ita-por flores200-devtest 0.58279 28.8 1012 26519
|
60 |
+
ita-spa flores200-devtest 0.52348 23.2 1012 29199
|
61 |
+
kea-deu flores200-devtest 0.49089 19.3 1012 25094
|
62 |
+
kea-eng flores200-devtest 0.60553 35.5 1012 24721
|
63 |
+
kea-fra flores200-devtest 0.54027 26.6 1012 28343
|
64 |
+
kea-por flores200-devtest 0.57696 28.9 1012 26519
|
65 |
+
kea-spa flores200-devtest 0.46974 18.0 1012 29199
|
66 |
+
lij-deu flores200-devtest 0.51695 22.7 1012 25094
|
67 |
+
lij-eng flores200-devtest 0.62347 36.2 1012 24721
|
68 |
+
lij-fra flores200-devtest 0.57498 31.4 1012 28343
|
69 |
+
lij-por flores200-devtest 0.56183 29.4 1012 26519
|
70 |
+
lij-spa flores200-devtest 0.48038 20.0 1012 29199
|
71 |
+
lmo-deu flores200-devtest 0.45516 15.4 1012 25094
|
72 |
+
lmo-eng flores200-devtest 0.53540 25.5 1012 24721
|
73 |
+
lmo-fra flores200-devtest 0.50076 22.2 1012 28343
|
74 |
+
lmo-por flores200-devtest 0.50134 22.9 1012 26519
|
75 |
+
lmo-spa flores200-devtest 0.44053 16.2 1012 29199
|
76 |
+
oci-deu flores200-devtest 0.57822 28.7 1012 25094
|
77 |
+
oci-eng flores200-devtest 0.73030 50.7 1012 24721
|
78 |
+
oci-fra flores200-devtest 0.64900 39.7 1012 28343
|
79 |
+
oci-por flores200-devtest 0.63318 36.9 1012 26519
|
80 |
+
oci-spa flores200-devtest 0.52269 22.9 1012 29199
|
81 |
+
pap-deu flores200-devtest 0.53166 23.2 1012 25094
|
82 |
+
pap-eng flores200-devtest 0.68541 44.6 1012 24721
|
83 |
+
pap-fra flores200-devtest 0.57224 30.5 1012 28343
|
84 |
+
pap-por flores200-devtest 0.59064 33.2 1012 26519
|
85 |
+
pap-spa flores200-devtest 0.49601 21.7 1012 29199
|
86 |
+
por-deu flores200-devtest 0.59047 30.3 1012 25094
|
87 |
+
por-eng flores200-devtest 0.71096 48.0 1012 24721
|
88 |
+
por-fra flores200-devtest 0.64555 40.1 1012 28343
|
89 |
+
por-spa flores200-devtest 0.53400 25.1 1012 29199
|
90 |
+
ron-deu flores200-devtest 0.58428 28.7 1012 25094
|
91 |
+
ron-eng flores200-devtest 0.67719 41.8 1012 24721
|
92 |
+
ron-fra flores200-devtest 0.63678 37.6 1012 28343
|
93 |
+
ron-por flores200-devtest 0.62371 36.1 1012 26519
|
94 |
+
ron-spa flores200-devtest 0.53150 24.5 1012 29199
|
95 |
+
scn-deu flores200-devtest 0.48102 19.2 1012 25094
|
96 |
+
scn-eng flores200-devtest 0.55782 29.6 1012 24721
|
97 |
+
scn-fra flores200-devtest 0.52773 26.1 1012 28343
|
98 |
+
scn-por flores200-devtest 0.51894 25.2 1012 26519
|
99 |
+
scn-spa flores200-devtest 0.45724 17.9 1012 29199
|
100 |
+
spa-deu flores200-devtest 0.53451 21.5 1012 25094
|
101 |
+
spa-eng flores200-devtest 0.58896 28.5 1012 24721
|
102 |
+
spa-fra flores200-devtest 0.57406 27.6 1012 28343
|
103 |
+
spa-por flores200-devtest 0.55749 25.2 1012 26519
|
104 |
+
srd-deu flores200-devtest 0.49238 19.9 1012 25094
|
105 |
+
srd-eng flores200-devtest 0.59392 34.2 1012 24721
|
106 |
+
srd-fra flores200-devtest 0.54003 27.6 1012 28343
|
107 |
+
srd-por flores200-devtest 0.53842 27.9 1012 26519
|
108 |
+
srd-spa flores200-devtest 0.46002 18.2 1012 29199
|
109 |
+
vec-deu flores200-devtest 0.48795 19.3 1012 25094
|
110 |
+
vec-eng flores200-devtest 0.56840 30.7 1012 24721
|
111 |
+
vec-fra flores200-devtest 0.54164 27.3 1012 28343
|
112 |
+
vec-por flores200-devtest 0.53482 26.2 1012 26519
|
113 |
+
vec-spa flores200-devtest 0.46588 18.4 1012 29199
|
114 |
+
fra-deu generaltest2022 0.66476 42.4 2006 37696
|
115 |
+
fra-deu multi30k_test_2016_flickr 0.61797 32.6 1000 12106
|
116 |
+
fra-eng multi30k_test_2016_flickr 0.66271 47.2 1000 12955
|
117 |
+
fra-deu multi30k_test_2017_flickr 0.59701 29.4 1000 10755
|
118 |
+
fra-eng multi30k_test_2017_flickr 0.69422 50.3 1000 11374
|
119 |
+
fra-deu multi30k_test_2017_mscoco 0.55509 25.7 461 5158
|
120 |
+
fra-eng multi30k_test_2017_mscoco 0.67791 48.7 461 5231
|
121 |
+
fra-deu multi30k_test_2018_flickr 0.55237 24.0 1071 13703
|
122 |
+
fra-eng multi30k_test_2018_flickr 0.64722 43.8 1071 14689
|
123 |
+
fra-eng newsdiscusstest2015 0.61385 38.4 1500 26982
|
124 |
+
fra-deu newssyscomb2009 0.53530 23.7 502 11271
|
125 |
+
fra-eng newssyscomb2009 0.57297 31.3 502 11818
|
126 |
+
fra-spa newssyscomb2009 0.60233 34.1 502 12503
|
127 |
+
ita-deu newssyscomb2009 0.53590 22.4 502 11271
|
128 |
+
ita-eng newssyscomb2009 0.59976 34.8 502 11818
|
129 |
+
ita-fra newssyscomb2009 0.61232 33.5 502 12331
|
130 |
+
ita-spa newssyscomb2009 0.60782 35.3 502 12503
|
131 |
+
spa-deu newssyscomb2009 0.52853 21.8 502 11271
|
132 |
+
spa-eng newssyscomb2009 0.57347 31.0 502 11818
|
133 |
+
spa-fra newssyscomb2009 0.61436 34.3 502 12331
|
134 |
+
fra-deu newstest2008 0.53180 22.9 2051 47447
|
135 |
+
fra-eng newstest2008 0.54379 26.5 2051 49380
|
136 |
+
fra-spa newstest2008 0.58804 33.1 2051 52586
|
137 |
+
spa-deu newstest2008 0.52221 21.6 2051 47447
|
138 |
+
spa-eng newstest2008 0.55331 27.9 2051 49380
|
139 |
+
spa-fra newstest2008 0.58769 32.0 2051 52685
|
140 |
+
fra-deu newstest2009 0.52771 22.5 2525 62816
|
141 |
+
fra-eng newstest2009 0.56679 30.2 2525 65399
|
142 |
+
fra-spa newstest2009 0.58921 32.1 2525 68111
|
143 |
+
ita-deu newstest2009 0.53022 22.8 2525 62816
|
144 |
+
ita-eng newstest2009 0.59309 33.8 2525 65399
|
145 |
+
ita-fra newstest2009 0.59309 32.0 2525 69263
|
146 |
+
ita-spa newstest2009 0.59760 33.5 2525 68111
|
147 |
+
spa-deu newstest2009 0.52822 22.3 2525 62816
|
148 |
+
spa-eng newstest2009 0.56989 30.4 2525 65399
|
149 |
+
spa-fra newstest2009 0.59150 32.2 2525 69263
|
150 |
+
fra-deu newstest2010 0.53765 24.0 2489 61503
|
151 |
+
fra-eng newstest2010 0.59251 32.6 2489 61711
|
152 |
+
fra-spa newstest2010 0.62480 37.6 2489 65480
|
153 |
+
spa-deu newstest2010 0.55161 26.0 2489 61503
|
154 |
+
spa-eng newstest2010 0.61562 36.3 2489 61711
|
155 |
+
spa-fra newstest2010 0.62021 35.7 2489 66022
|
156 |
+
fra-deu newstest2011 0.53025 23.1 3003 72981
|
157 |
+
fra-eng newstest2011 0.59636 32.9 3003 74681
|
158 |
+
fra-spa newstest2011 0.63203 39.9 3003 79476
|
159 |
+
spa-deu newstest2011 0.52934 23.3 3003 72981
|
160 |
+
spa-eng newstest2011 0.59606 33.8 3003 74681
|
161 |
+
spa-fra newstest2011 0.61079 34.9 3003 80626
|
162 |
+
fra-deu newstest2012 0.52957 24.0 3003 72886
|
163 |
+
fra-eng newstest2012 0.59352 33.6 3003 72812
|
164 |
+
fra-spa newstest2012 0.62641 39.2 3003 79006
|
165 |
+
spa-deu newstest2012 0.53519 24.6 3003 72886
|
166 |
+
spa-eng newstest2012 0.62284 37.4 3003 72812
|
167 |
+
spa-fra newstest2012 0.61076 33.8 3003 78011
|
168 |
+
fra-deu newstest2013 0.54167 25.4 3000 63737
|
169 |
+
fra-eng newstest2013 0.59236 34.0 3000 64505
|
170 |
+
fra-spa newstest2013 0.59347 34.9 3000 70528
|
171 |
+
spa-deu newstest2013 0.55130 26.3 3000 63737
|
172 |
+
spa-eng newstest2013 0.60681 34.6 3000 64505
|
173 |
+
spa-fra newstest2013 0.59816 33.2 3000 70037
|
174 |
+
fra-eng newstest2014 0.63499 37.9 3003 70708
|
175 |
+
ron-eng newstest2016 0.63996 39.5 1999 47562
|
176 |
+
fra-deu newstest2019 0.60468 28.6 1701 36446
|
177 |
+
fra-deu newstest2020 0.61401 28.8 1619 30265
|
178 |
+
fra-deu newstest2021 0.65950 39.5 1026 26077
|
179 |
+
cat-deu ntrex128 0.54096 24.0 1997 48761
|
180 |
+
cat-eng ntrex128 0.63516 36.5 1997 47673
|
181 |
+
cat-fra ntrex128 0.56385 28.1 1997 53481
|
182 |
+
cat-por ntrex128 0.56246 28.7 1997 51631
|
183 |
+
cat-spa ntrex128 0.61311 35.8 1997 54107
|
184 |
+
fra-deu ntrex128 0.53059 23.4 1997 48761
|
185 |
+
fra-eng ntrex128 0.61285 34.7 1997 47673
|
186 |
+
fra-por ntrex128 0.54075 25.8 1997 51631
|
187 |
+
fra-spa ntrex128 0.56863 30.6 1997 54107
|
188 |
+
glg-deu ntrex128 0.53724 23.6 1997 48761
|
189 |
+
glg-eng ntrex128 0.64481 38.7 1997 47673
|
190 |
+
glg-fra ntrex128 0.55856 27.8 1997 53481
|
191 |
+
glg-por ntrex128 0.56322 28.7 1997 51631
|
192 |
+
glg-spa ntrex128 0.61794 36.8 1997 54107
|
193 |
+
ita-deu ntrex128 0.54678 25.0 1997 48761
|
194 |
+
ita-eng ntrex128 0.64636 39.2 1997 47673
|
195 |
+
ita-fra ntrex128 0.57428 30.0 1997 53481
|
196 |
+
ita-por ntrex128 0.56858 29.7 1997 51631
|
197 |
+
ita-spa ntrex128 0.58886 33.0 1997 54107
|
198 |
+
por-deu ntrex128 0.54833 24.6 1997 48761
|
199 |
+
por-eng ntrex128 0.65223 39.7 1997 47673
|
200 |
+
por-fra ntrex128 0.56793 28.9 1997 53481
|
201 |
+
por-spa ntrex128 0.59218 33.8 1997 54107
|
202 |
+
ron-deu ntrex128 0.53249 22.4 1997 48761
|
203 |
+
ron-eng ntrex128 0.61807 33.8 1997 47673
|
204 |
+
ron-fra ntrex128 0.55575 26.4 1997 53481
|
205 |
+
ron-por ntrex128 0.55086 27.2 1997 51631
|
206 |
+
ron-spa ntrex128 0.57787 31.9 1997 54107
|
207 |
+
spa-deu ntrex128 0.54309 23.8 1997 48761
|
208 |
+
spa-eng ntrex128 0.64416 37.4 1997 47673
|
209 |
+
spa-fra ntrex128 0.57320 29.4 1997 53481
|
210 |
+
spa-por ntrex128 0.56751 29.0 1997 51631
|
211 |
+
cat-fra tatoeba-test-v2020-07-28 0.71145 53.4 686 5517
|
212 |
+
cat-por tatoeba-test-v2020-07-28 0.75553 58.2 729 5847
|
213 |
+
fra-deu tatoeba-test-v2020-07-28 0.67550 49.0 10000 80271
|
214 |
+
fra-por tatoeba-test-v2020-07-28 0.70309 51.3 10000 71341
|
215 |
+
lad-eng tatoeba-test-v2020-07-28 0.40440 9.7 629 3456
|
216 |
+
lad-spa tatoeba-test-v2020-07-28 0.52785 17.7 207 1076
|
217 |
+
lad_Latn-eng tatoeba-test-v2020-07-28 0.53006 36.0 582 3200
|
218 |
+
lat-eng tatoeba-test-v2020-07-28 0.42350 24.0 10000 98199
|
219 |
+
lat-fra tatoeba-test-v2020-07-28 5.874 0.0 2917 39174
|
220 |
+
lat-por tatoeba-test-v2020-07-28 0.36214 15.3 5000 64031
|
221 |
+
ron-eng tatoeba-test-v2020-07-28 0.72536 58.1 5000 37125
|
222 |
+
ron-spa tatoeba-test-v2020-07-28 0.73447 57.1 1961 12694
|
223 |
+
spa-deu tatoeba-test-v2020-07-28 0.67420 48.4 10000 81214
|
224 |
+
spa-eng tatoeba-test-v2020-07-28 0.73549 59.3 10000 79376
|
225 |
+
spa-fra tatoeba-test-v2020-07-28 0.72951 56.1 10000 80915
|
226 |
+
spa-por tatoeba-test-v2020-07-28 0.77409 61.2 10000 77911
|
227 |
+
cat-deu tatoeba-test-v2021-03-30 0.66677 48.0 727 5718
|
228 |
+
cat-fra tatoeba-test-v2021-03-30 0.70866 52.8 705 5724
|
229 |
+
fra-deu tatoeba-test-v2021-03-30 0.67931 49.2 11388 91323
|
230 |
+
fra-por tatoeba-test-v2021-03-30 0.70342 51.4 10151 72451
|
231 |
+
fra-spa tatoeba-test-v2021-03-30 0.72033 54.7 10122 77059
|
232 |
+
gcf-fra tatoeba-test-v2021-03-30 0.35546 13.0 1166 6320
|
233 |
+
glg-eng tatoeba-test-v2021-03-30 0.69780 54.6 1020 8470
|
234 |
+
glg-por tatoeba-test-v2021-03-30 0.77610 62.2 438 3138
|
235 |
+
ita-fra tatoeba-test-v2021-03-30 0.77938 63.8 10041 65856
|
236 |
+
lad-deu tatoeba-test-v2021-03-30 0.33457 5.2 229 1222
|
237 |
+
lad_Latn-eng tatoeba-test-v2021-03-30 0.53968 36.5 696 3796
|
238 |
+
lad_Latn-spa tatoeba-test-v2021-03-30 0.62677 45.1 242 1294
|
239 |
+
lat-fra tatoeba-test-v2021-03-30 0.29569 10.0 2917 39174
|
240 |
+
lat-por tatoeba-test-v2021-03-30 0.36236 15.4 5002 64081
|
241 |
+
lat_Latn-por tatoeba-test-v2021-03-30 0.36250 15.4 5001 64073
|
242 |
+
oci-eng tatoeba-test-v2021-03-30 0.41695 23.1 842 5306
|
243 |
+
oci-fra tatoeba-test-v2021-03-30 0.49237 28.6 807 6310
|
244 |
+
pms-eng tatoeba-test-v2021-03-30 0.38613 19.4 270 2061
|
245 |
+
por-eng tatoeba-test-v2021-03-30 0.76355 63.4 11574 87523
|
246 |
+
por-por tatoeba-test-v2021-03-30 0.72833 52.5 2500 19220
|
247 |
+
por-spa tatoeba-test-v2021-03-30 0.79534 64.9 10395 80844
|
248 |
+
ron-eng tatoeba-test-v2021-03-30 0.72627 58.2 10019 74340
|
249 |
+
ron-fra tatoeba-test-v2021-03-30 0.70061 53.2 1952 13478
|
250 |
+
ron-por tatoeba-test-v2021-03-30 0.72601 53.0 715 4807
|
251 |
+
ron-spa tatoeba-test-v2021-03-30 0.73447 57.1 1961 12694
|
252 |
+
spa-deu tatoeba-test-v2021-03-30 0.67447 48.4 10138 82525
|
253 |
+
spa-eng tatoeba-test-v2021-03-30 0.73648 59.5 11940 96122
|
254 |
+
spa-fra tatoeba-test-v2021-03-30 0.73003 56.1 10122 82050
|
255 |
+
spa-por tatoeba-test-v2021-03-30 0.77312 61.1 10395 81022
|
256 |
+
cat-deu tatoeba-test-v2021-08-07 0.66856 47.9 723 5676
|
257 |
+
cat-eng tatoeba-test-v2021-08-07 0.72313 57.9 1631 12627
|
258 |
+
cat-fra tatoeba-test-v2021-08-07 0.71565 53.8 700 5664
|
259 |
+
cat-por tatoeba-test-v2021-08-07 0.75797 58.7 747 6119
|
260 |
+
cat-spa tatoeba-test-v2021-08-07 0.87610 77.7 1534 12094
|
261 |
+
fra-deu tatoeba-test-v2021-08-07 0.68638 50.0 12418 100545
|
262 |
+
fra-eng tatoeba-test-v2021-08-07 0.72664 58.0 12681 101754
|
263 |
+
fra-fra tatoeba-test-v2021-08-07 0.62093 40.6 1000 7757
|
264 |
+
fra-por tatoeba-test-v2021-08-07 0.70764 52.0 10518 77650
|
265 |
+
fra-spa tatoeba-test-v2021-08-07 0.72229 55.0 10294 78406
|
266 |
+
gcf-fra tatoeba-test-v2021-08-07 0.34758 12.7 1164 6309
|
267 |
+
glg-eng tatoeba-test-v2021-08-07 0.70552 55.7 1015 8421
|
268 |
+
glg-por tatoeba-test-v2021-08-07 0.77067 62.1 433 3105
|
269 |
+
glg-spa tatoeba-test-v2021-08-07 0.82795 72.1 2121 17443
|
270 |
+
ita-deu tatoeba-test-v2021-08-07 0.68325 49.4 10094 79762
|
271 |
+
ita-eng tatoeba-test-v2021-08-07 0.81176 70.5 17320 119214
|
272 |
+
ita-fra tatoeba-test-v2021-08-07 0.78299 64.4 10091 66377
|
273 |
+
ita-por tatoeba-test-v2021-08-07 0.74169 55.6 3066 25668
|
274 |
+
ita-spa tatoeba-test-v2021-08-07 0.77673 63.0 5000 34937
|
275 |
+
lad-deu tatoeba-test-v2021-08-07 0.31777 4.6 220 1175
|
276 |
+
lad-eng tatoeba-test-v2021-08-07 0.36847 7.6 768 4184
|
277 |
+
lad-spa tatoeba-test-v2021-08-07 0.37655 6.5 276 1448
|
278 |
+
lad_Latn-eng tatoeba-test-v2021-08-07 0.54247 36.7 672 3665
|
279 |
+
lad_Latn-spa tatoeba-test-v2021-08-07 0.59790 40.4 239 1239
|
280 |
+
lat-deu tatoeba-test-v2021-08-07 0.42548 24.8 2016 13326
|
281 |
+
lat-eng tatoeba-test-v2021-08-07 0.42385 24.3 10298 100152
|
282 |
+
lat-fra tatoeba-test-v2021-08-07 0.29490 10.1 2915 39168
|
283 |
+
lat-por tatoeba-test-v2021-08-07 0.36372 15.6 5001 64039
|
284 |
+
lat-spa tatoeba-test-v2021-08-07 0.45821 25.2 3129 34036
|
285 |
+
lat_Latn-por tatoeba-test-v2021-08-07 0.36386 15.6 5000 64031
|
286 |
+
oci-eng tatoeba-test-v2021-08-07 0.40921 22.4 841 5299
|
287 |
+
oci-fra tatoeba-test-v2021-08-07 0.49044 28.4 806 6302
|
288 |
+
pcd-fra tatoeba-test-v2021-08-07 0.41500 15.0 266 1677
|
289 |
+
pms-eng tatoeba-test-v2021-08-07 0.39308 20.8 269 2059
|
290 |
+
por-deu tatoeba-test-v2021-08-07 0.68379 48.8 10000 81246
|
291 |
+
por-eng tatoeba-test-v2021-08-07 0.77089 64.2 13222 105351
|
292 |
+
por-fra tatoeba-test-v2021-08-07 0.75364 58.7 10518 80459
|
293 |
+
por-por tatoeba-test-v2021-08-07 0.71396 50.3 2500 19220
|
294 |
+
por-spa tatoeba-test-v2021-08-07 0.79684 65.2 10947 87335
|
295 |
+
ron-deu tatoeba-test-v2021-08-07 0.68217 50.3 1141 7893
|
296 |
+
ron-eng tatoeba-test-v2021-08-07 0.73059 59.0 5508 40717
|
297 |
+
ron-fra tatoeba-test-v2021-08-07 0.70724 54.1 1925 13347
|
298 |
+
ron-por tatoeba-test-v2021-08-07 0.73085 53.3 681 4593
|
299 |
+
ron-spa tatoeba-test-v2021-08-07 0.73813 57.6 1959 12679
|
300 |
+
spa-deu tatoeba-test-v2021-08-07 0.68124 49.3 10521 86430
|
301 |
+
spa-eng tatoeba-test-v2021-08-07 0.74977 61.0 16583 138123
|
302 |
+
spa-fra tatoeba-test-v2021-08-07 0.73392 56.6 10294 83501
|
303 |
+
spa-por tatoeba-test-v2021-08-07 0.77280 61.1 10947 87610
|
304 |
+
spa-spa tatoeba-test-v2021-08-07 0.68111 50.9 2500 21469
|
305 |
+
fra-eng tico19-test 0.62364 39.7 2100 56323
|
306 |
+
fra-por tico19-test 0.58563 34.2 2100 62729
|
307 |
+
fra-spa tico19-test 0.59556 36.5 2100 66563
|
308 |
+
por-eng tico19-test 0.74420 51.8 2100 56315
|
309 |
+
por-fra tico19-test 0.60081 34.5 2100 64661
|
310 |
+
por-spa tico19-test 0.68156 44.8 2100 66563
|
311 |
+
spa-eng tico19-test 0.73454 50.3 2100 56315
|
312 |
+
spa-fra tico19-test 0.60441 34.9 2100 64661
|
313 |
+
spa-por tico19-test 0.67749 42.7 2100 62729
|
benchmark_translations.zip
ADDED
File without changes
|
config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "pytorch-models/opus-mt-tc-bible-big-itc-deu_eng_fra_por_spa",
|
3 |
+
"activation_dropout": 0.0,
|
4 |
+
"activation_function": "relu",
|
5 |
+
"architectures": [
|
6 |
+
"MarianMTModel"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 0,
|
10 |
+
"classifier_dropout": 0.0,
|
11 |
+
"d_model": 1024,
|
12 |
+
"decoder_attention_heads": 16,
|
13 |
+
"decoder_ffn_dim": 4096,
|
14 |
+
"decoder_layerdrop": 0.0,
|
15 |
+
"decoder_layers": 6,
|
16 |
+
"decoder_start_token_id": 45340,
|
17 |
+
"decoder_vocab_size": 45341,
|
18 |
+
"dropout": 0.1,
|
19 |
+
"encoder_attention_heads": 16,
|
20 |
+
"encoder_ffn_dim": 4096,
|
21 |
+
"encoder_layerdrop": 0.0,
|
22 |
+
"encoder_layers": 6,
|
23 |
+
"eos_token_id": 456,
|
24 |
+
"forced_eos_token_id": null,
|
25 |
+
"init_std": 0.02,
|
26 |
+
"is_encoder_decoder": true,
|
27 |
+
"max_length": null,
|
28 |
+
"max_position_embeddings": 1024,
|
29 |
+
"model_type": "marian",
|
30 |
+
"normalize_embedding": false,
|
31 |
+
"num_beams": null,
|
32 |
+
"num_hidden_layers": 6,
|
33 |
+
"pad_token_id": 45340,
|
34 |
+
"scale_embedding": true,
|
35 |
+
"share_encoder_decoder_embeddings": true,
|
36 |
+
"static_position_embeddings": true,
|
37 |
+
"torch_dtype": "float32",
|
38 |
+
"transformers_version": "4.45.1",
|
39 |
+
"use_cache": true,
|
40 |
+
"vocab_size": 45341
|
41 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bad_words_ids": [
|
4 |
+
[
|
5 |
+
45340
|
6 |
+
]
|
7 |
+
],
|
8 |
+
"bos_token_id": 0,
|
9 |
+
"decoder_start_token_id": 45340,
|
10 |
+
"eos_token_id": 456,
|
11 |
+
"forced_eos_token_id": 456,
|
12 |
+
"max_length": 512,
|
13 |
+
"num_beams": 4,
|
14 |
+
"pad_token_id": 45340,
|
15 |
+
"transformers_version": "4.45.1"
|
16 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da04ff3a6f81336247162a8181522179b6f0449f88dbb6718b4121bce52565dc
|
3 |
+
size 891357220
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f353c12a68dfaa832334782cb051e2366d1cfa987dcb79cf6ccbb124a820fa5e
|
3 |
+
size 891408453
|
source.spm
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de5d95ad9b90d3e6df60681716862521db8f36b0c6afa158dee6592eef0e1ad
|
3 |
+
size 804986
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
|
target.spm
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b1dadb2fa563686bd76dc848270a88de8e1b5f1cb3b9255ff8b09150d309f91
|
3 |
+
size 807512
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"source_lang": "itc", "target_lang": "deu+eng+fra+por+spa", "unk_token": "<unk>", "eos_token": "</s>", "pad_token": "<pad>", "model_max_length": 512, "sp_model_kwargs": {}, "separate_vocabs": false, "special_tokens_map_file": null, "name_or_path": "marian-models/opusTCv20230926max50+bt+jhubc_transformer-big_2024-05-30/itc-deu+eng+fra+por+spa", "tokenizer_class": "MarianTokenizer"}
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|