anton-l HF staff committed on
Commit
b9380a2
1 Parent(s): de071fe

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,320 @@
1
  {
2
  "epoch": 4.07,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "train_loss": 5.854813561474184e-06,
4
- "train_runtime": 574.8329,
5
  "train_samples": 246408,
6
- "train_samples_per_second": 2143.301,
7
- "train_steps_per_second": 33.497
8
  }
1
  {
2
  "epoch": 4.07,
3
+ "epoch_af_za": 4.07,
4
+ "epoch_am_et": 4.07,
5
+ "epoch_ar_eg": 4.07,
6
+ "epoch_as_in": 4.07,
7
+ "epoch_ast_es": 4.07,
8
+ "epoch_az_az": 4.07,
9
+ "epoch_be_by": 4.07,
10
+ "epoch_bn_in": 4.07,
11
+ "epoch_bs_ba": 4.07,
12
+ "epoch_ca_es": 4.07,
13
+ "epoch_ceb_ph": 4.07,
14
+ "epoch_cmn_hans_cn": 4.07,
15
+ "epoch_cs_cz": 4.07,
16
+ "epoch_cy_gb": 4.07,
17
+ "epoch_da_dk": 4.07,
18
+ "epoch_de_de": 4.07,
19
+ "epoch_el_gr": 4.07,
20
+ "epoch_en_us": 4.07,
21
+ "epoch_es_419": 4.07,
22
+ "epoch_et_ee": 4.07,
23
+ "epoch_fa_ir": 4.07,
24
+ "epoch_ff_sn": 4.07,
25
+ "epoch_fi_fi": 4.07,
26
+ "epoch_fil_ph": 4.07,
27
+ "epoch_fr_fr": 4.07,
28
+ "epoch_ga_ie": 4.07,
29
+ "epoch_gl_es": 4.07,
30
+ "epoch_gu_in": 4.07,
31
+ "epoch_ha_ng": 4.07,
32
+ "epoch_he_il": 4.07,
33
+ "epoch_hi_in": 4.07,
34
+ "epoch_hr_hr": 4.07,
35
+ "epoch_hu_hu": 4.07,
36
+ "epoch_hy_am": 4.07,
37
+ "epoch_id_id": 4.07,
38
+ "epoch_ig_ng": 4.07,
39
+ "epoch_is_is": 4.07,
40
+ "epoch_it_it": 4.07,
41
+ "epoch_ja_jp": 4.07,
42
+ "epoch_jv_id": 4.07,
43
+ "epoch_ka_ge": 4.07,
44
+ "epoch_kam_ke": 4.07,
45
+ "epoch_kea_cv": 4.07,
46
+ "epoch_kk_kz": 4.07,
47
+ "epoch_km_kh": 4.07,
48
+ "epoch_kn_in": 4.07,
49
+ "epoch_ko_kr": 4.07,
50
+ "epoch_ku_arab_iq": 4.07,
51
+ "epoch_ky_kg": 4.07,
52
+ "epoch_lb_lu": 4.07,
53
+ "epoch_lg_ug": 4.07,
54
+ "epoch_ln_cd": 4.07,
55
+ "epoch_lo_la": 4.07,
56
+ "epoch_lt_lt": 4.07,
57
+ "epoch_luo_ke": 4.07,
58
+ "epoch_lv_lv": 4.07,
59
+ "epoch_mi_nz": 4.07,
60
+ "epoch_mk_mk": 4.07,
61
+ "epoch_ml_in": 4.07,
62
+ "epoch_mn_mn": 4.07,
63
+ "epoch_mr_in": 4.07,
64
+ "epoch_ms_my": 4.07,
65
+ "epoch_mt_mt": 4.07,
66
+ "epoch_my_mm": 4.07,
67
+ "epoch_nb_no": 4.07,
68
+ "epoch_ne_np": 4.07,
69
+ "epoch_nl_nl": 4.07,
70
+ "epoch_nso_za": 4.07,
71
+ "epoch_ny_mw": 4.07,
72
+ "epoch_oci_fr": 4.07,
73
+ "epoch_om_et": 4.07,
74
+ "epoch_or_in": 4.07,
75
+ "epoch_pa_in": 4.07,
76
+ "epoch_pl_pl": 4.07,
77
+ "epoch_ps_af": 4.07,
78
+ "epoch_pt_br": 4.07,
79
+ "epoch_ro_ro": 4.07,
80
+ "epoch_ru_ru": 4.07,
81
+ "epoch_rup_bg": 4.07,
82
+ "epoch_sd_arab_in": 4.07,
83
+ "epoch_sk_sk": 4.07,
84
+ "epoch_sl_si": 4.07,
85
+ "epoch_sn_zw": 4.07,
86
+ "epoch_so_so": 4.07,
87
+ "epoch_sr_rs": 4.07,
88
+ "epoch_sv_se": 4.07,
89
+ "epoch_sw_ke": 4.07,
90
+ "epoch_ta_in": 4.07,
91
+ "epoch_te_in": 4.07,
92
+ "epoch_tg_tj": 4.07,
93
+ "epoch_th_th": 4.07,
94
+ "epoch_tr_tr": 4.07,
95
+ "epoch_uk_ua": 4.07,
96
+ "epoch_umb_ao": 4.07,
97
+ "epoch_ur_pk": 4.07,
98
+ "epoch_uz_uz": 4.07,
99
+ "epoch_vi_vn": 4.07,
100
+ "epoch_wo_sn": 4.07,
101
+ "epoch_xh_za": 4.07,
102
+ "epoch_yo_ng": 4.07,
103
+ "epoch_yue_hant_hk": 4.07,
104
+ "epoch_zu_za": 4.07,
105
+ "eval_accuracy": 0.7271468398716529,
106
+ "eval_accuracy_af_za": 0.3864734299516908,
107
+ "eval_accuracy_am_et": 0.8817829457364341,
108
+ "eval_accuracy_ar_eg": 0.9976635514018691,
109
+ "eval_accuracy_as_in": 0.9857723577235772,
110
+ "eval_accuracy_ast_es": 0.8361522198731501,
111
+ "eval_accuracy_az_az": 0.838569880823402,
112
+ "eval_accuracy_be_by": 0.40847983453981385,
113
+ "eval_accuracy_bn_in": 0.9989130434782608,
114
+ "eval_accuracy_bs_ba": 0.2508108108108108,
115
+ "eval_accuracy_ca_es": 0.6946808510638298,
116
+ "eval_accuracy_ceb_ph": 0.9852125693160814,
117
+ "eval_accuracy_cmn_hans_cn": 0.9798941798941799,
118
+ "eval_accuracy_cs_cz": 0.5352697095435685,
119
+ "eval_accuracy_cy_gb": 0.9715964740450539,
120
+ "eval_accuracy_da_dk": 0.6688172043010753,
121
+ "eval_accuracy_de_de": 0.7807424593967517,
122
+ "eval_accuracy_el_gr": 0.7692307692307693,
123
+ "eval_accuracy_en_us": 0.98145285935085,
124
+ "eval_accuracy_es_419": 0.9845814977973568,
125
+ "eval_accuracy_et_ee": 0.522956326987682,
126
+ "eval_accuracy_fa_ir": 0.8461538461538461,
127
+ "eval_accuracy_ff_sn": 0.23484848484848486,
128
+ "eval_accuracy_fi_fi": 0.9978213507625272,
129
+ "eval_accuracy_fil_ph": 0.9564315352697096,
130
+ "eval_accuracy_fr_fr": 0.985207100591716,
131
+ "eval_accuracy_ga_ie": 0.8467933491686461,
132
+ "eval_accuracy_gl_es": 0.5016181229773463,
133
+ "eval_accuracy_gu_in": 0.973,
134
+ "eval_accuracy_ha_ng": 0.9162640901771336,
135
+ "eval_accuracy_he_il": 0.8042929292929293,
136
+ "eval_accuracy_hi_in": 0.9354066985645934,
137
+ "eval_accuracy_hr_hr": 0.36542669584245074,
138
+ "eval_accuracy_hu_hu": 0.8044198895027624,
139
+ "eval_accuracy_hy_am": 0.9914163090128756,
140
+ "eval_accuracy_id_id": 0.9868995633187773,
141
+ "eval_accuracy_ig_ng": 0.936016511867905,
142
+ "eval_accuracy_is_is": 0.021739130434782608,
143
+ "eval_accuracy_it_it": 0.8,
144
+ "eval_accuracy_ja_jp": 0.7384615384615385,
145
+ "eval_accuracy_jv_id": 0.5824175824175825,
146
+ "eval_accuracy_ka_ge": 0.8610827374872319,
147
+ "eval_accuracy_kam_ke": 0.4183796856106409,
148
+ "eval_accuracy_kea_cv": 0.8692129629629629,
149
+ "eval_accuracy_kk_kz": 0.8726635514018691,
150
+ "eval_accuracy_km_kh": 0.7029831387808041,
151
+ "eval_accuracy_kn_in": 0.9630071599045346,
152
+ "eval_accuracy_ko_kr": 0.9842931937172775,
153
+ "eval_accuracy_ku_arab_iq": 0.9577006507592191,
154
+ "eval_accuracy_ky_kg": 0.8935516888433982,
155
+ "eval_accuracy_lb_lu": 0.8897216274089935,
156
+ "eval_accuracy_lg_ug": 0.9253112033195021,
157
+ "eval_accuracy_ln_cd": 0.9644351464435147,
158
+ "eval_accuracy_lo_la": 0.1580246913580247,
159
+ "eval_accuracy_lt_lt": 0.4685598377281947,
160
+ "eval_accuracy_luo_ke": 0.9921875,
161
+ "eval_accuracy_lv_lv": 0.6498237367802585,
162
+ "eval_accuracy_mi_nz": 0.9613095238095238,
163
+ "eval_accuracy_mk_mk": 0.763617677286742,
164
+ "eval_accuracy_ml_in": 0.6962421711899791,
165
+ "eval_accuracy_mn_mn": 0.8461538461538461,
166
+ "eval_accuracy_mr_in": 0.39113300492610836,
167
+ "eval_accuracy_ms_my": 0.36315086782376504,
168
+ "eval_accuracy_mt_mt": 0.6187904967602592,
169
+ "eval_accuracy_my_mm": 0.9704545454545455,
170
+ "eval_accuracy_nb_no": 0.6890756302521008,
171
+ "eval_accuracy_ne_np": 0.8994490358126722,
172
+ "eval_accuracy_nl_nl": 0.9093406593406593,
173
+ "eval_accuracy_nso_za": 0.8873417721518987,
174
+ "eval_accuracy_ny_mw": 0.469119579500657,
175
+ "eval_accuracy_oci_fr": 0.1533066132264529,
176
+ "eval_accuracy_om_et": 0.9512195121951219,
177
+ "eval_accuracy_or_in": 0.5447338618346546,
178
+ "eval_accuracy_pa_in": 0.8153310104529616,
179
+ "eval_accuracy_pl_pl": 0.7757255936675461,
180
+ "eval_accuracy_ps_af": 0.810546875,
181
+ "eval_accuracy_pt_br": 0.7714907508161044,
182
+ "eval_accuracy_ro_ro": 0.41223103057757643,
183
+ "eval_accuracy_ru_ru": 0.9793548387096774,
184
+ "eval_accuracy_rup_bg": 0.9468085106382979,
185
+ "eval_accuracy_sd_arab_in": 0.5244897959183673,
186
+ "eval_accuracy_sk_sk": 0.8623737373737373,
187
+ "eval_accuracy_sl_si": 0.02997601918465228,
188
+ "eval_accuracy_sn_zw": 0.8843243243243243,
189
+ "eval_accuracy_so_so": 0.8802747791952895,
190
+ "eval_accuracy_sr_rs": 0.025714285714285714,
191
+ "eval_accuracy_sv_se": 0.014492753623188406,
192
+ "eval_accuracy_sw_ke": 0.919917864476386,
193
+ "eval_accuracy_ta_in": 0.9526226734348562,
194
+ "eval_accuracy_te_in": 0.9788135593220338,
195
+ "eval_accuracy_tg_tj": 0.9883333333333333,
196
+ "eval_accuracy_th_th": 0.9911851126346719,
197
+ "eval_accuracy_tr_tr": 0.7886944818304172,
198
+ "eval_accuracy_uk_ua": 0.06266666666666666,
199
+ "eval_accuracy_umb_ao": 0.7862796833773087,
200
+ "eval_accuracy_ur_pk": 0.013377926421404682,
201
+ "eval_accuracy_uz_uz": 0.4013921113689095,
202
+ "eval_accuracy_vi_vn": 0.7246207701283547,
203
+ "eval_accuracy_wo_sn": 0.4555256064690027,
204
+ "eval_accuracy_xh_za": 1.0,
205
+ "eval_accuracy_yo_ng": 0.7352587244283996,
206
+ "eval_accuracy_yue_hant_hk": 0.7985347985347986,
207
+ "eval_accuracy_zu_za": 0.46955503512880564,
208
+ "eval_loss": 1.378929700578024,
209
+ "eval_loss_af_za": 2.6778101921081543,
210
+ "eval_loss_am_et": 0.46154311299324036,
211
+ "eval_loss_ar_eg": 0.014941702596843243,
212
+ "eval_loss_as_in": 0.07641631364822388,
213
+ "eval_loss_ast_es": 0.4559924304485321,
214
+ "eval_loss_az_az": 0.5676775574684143,
215
+ "eval_loss_be_by": 1.9230682849884033,
216
+ "eval_loss_bn_in": 0.002447569975629449,
217
+ "eval_loss_bs_ba": 2.4953715801239014,
218
+ "eval_loss_ca_es": 1.2631815671920776,
219
+ "eval_loss_ceb_ph": 0.04263082891702652,
220
+ "eval_loss_cmn_hans_cn": 0.06501840800046921,
221
+ "eval_loss_cs_cz": 1.9333536624908447,
222
+ "eval_loss_cy_gb": 0.1273733228445053,
223
+ "eval_loss_da_dk": 1.4990081787109375,
224
+ "eval_loss_de_de": 0.8820119500160217,
225
+ "eval_loss_el_gr": 0.9838642477989197,
226
+ "eval_loss_en_us": 0.08269134163856506,
227
+ "eval_loss_es_419": 0.05156087502837181,
228
+ "eval_loss_et_ee": 1.9264016151428223,
229
+ "eval_loss_fa_ir": 0.6519789695739746,
230
+ "eval_loss_ff_sn": 5.428281307220459,
231
+ "eval_loss_fi_fi": 0.010886545293033123,
232
+ "eval_loss_fil_ph": 0.17060022056102753,
233
+ "eval_loss_fr_fr": 0.0590590201318264,
234
+ "eval_loss_ga_ie": 0.5173550248146057,
235
+ "eval_loss_gl_es": 1.2657122611999512,
236
+ "eval_loss_gu_in": 0.08499378710985184,
237
+ "eval_loss_ha_ng": 0.3233623802661896,
238
+ "eval_loss_he_il": 0.8299161195755005,
239
+ "eval_loss_hi_in": 0.4189773201942444,
240
+ "eval_loss_hr_hr": 2.9754278659820557,
241
+ "eval_loss_hu_hu": 0.8344607949256897,
242
+ "eval_loss_hy_am": 0.03288033604621887,
243
+ "eval_loss_id_id": 0.05292920395731926,
244
+ "eval_loss_ig_ng": 0.25233691930770874,
245
+ "eval_loss_is_is": 6.5153117179870605,
246
+ "eval_loss_it_it": 0.8113388419151306,
247
+ "eval_loss_ja_jp": 1.396775245666504,
248
+ "eval_loss_jv_id": 2.0009281635284424,
249
+ "eval_loss_ka_ge": 0.6161583065986633,
250
+ "eval_loss_kam_ke": 2.219219446182251,
251
+ "eval_loss_kea_cv": 0.5567307472229004,
252
+ "eval_loss_kk_kz": 0.5592476725578308,
253
+ "eval_loss_km_kh": 1.7357780933380127,
254
+ "eval_loss_kn_in": 0.10634830594062805,
255
+ "eval_loss_ko_kr": 0.151944100856781,
256
+ "eval_loss_ku_arab_iq": 0.2075168490409851,
257
+ "eval_loss_ky_kg": 0.46389031410217285,
258
+ "eval_loss_lb_lu": 0.44538378715515137,
259
+ "eval_loss_lg_ug": 0.37638625502586365,
260
+ "eval_loss_ln_cd": 0.18439875543117523,
261
+ "eval_loss_lo_la": 3.805140495300293,
262
+ "eval_loss_lt_lt": 2.5053646564483643,
263
+ "eval_loss_luo_ke": 0.047887783497571945,
264
+ "eval_loss_lv_lv": 1.3713427782058716,
265
+ "eval_loss_mi_nz": 0.13896487653255463,
266
+ "eval_loss_mk_mk": 0.7952373027801514,
267
+ "eval_loss_ml_in": 1.2999218702316284,
268
+ "eval_loss_mn_mn": 0.7620733976364136,
269
+ "eval_loss_mr_in": 3.705583095550537,
270
+ "eval_loss_ms_my": 3.0192301273345947,
271
+ "eval_loss_mt_mt": 1.5519871711730957,
272
+ "eval_loss_my_mm": 0.15139135718345642,
273
+ "eval_loss_nb_no": 1.1194071769714355,
274
+ "eval_loss_ne_np": 0.4230792224407196,
275
+ "eval_loss_nl_nl": 0.3290546238422394,
276
+ "eval_loss_nso_za": 0.510554313659668,
277
+ "eval_loss_ny_mw": 2.734614610671997,
278
+ "eval_loss_oci_fr": 5.098300933837891,
279
+ "eval_loss_om_et": 0.2296750545501709,
280
+ "eval_loss_or_in": 2.543181896209717,
281
+ "eval_loss_pa_in": 0.7753236293792725,
282
+ "eval_loss_pl_pl": 0.7309491634368896,
283
+ "eval_loss_ps_af": 1.0454343557357788,
284
+ "eval_loss_pt_br": 0.9782202243804932,
285
+ "eval_loss_ro_ro": 3.5829010009765625,
286
+ "eval_loss_ru_ru": 0.059757012873888016,
287
+ "eval_loss_rup_bg": 0.1694687306880951,
288
+ "eval_loss_sd_arab_in": 2.619832992553711,
289
+ "eval_loss_sk_sk": 0.5583317875862122,
290
+ "eval_loss_sl_si": 6.092343807220459,
291
+ "eval_loss_sn_zw": 0.44645825028419495,
292
+ "eval_loss_so_so": 0.4492073059082031,
293
+ "eval_loss_sr_rs": 4.757461071014404,
294
+ "eval_loss_sv_se": 6.585770130157471,
295
+ "eval_loss_sw_ke": 0.42353829741477966,
296
+ "eval_loss_ta_in": 0.18184617161750793,
297
+ "eval_loss_te_in": 0.08084087073802948,
298
+ "eval_loss_tg_tj": 0.0912216454744339,
299
+ "eval_loss_th_th": 0.04623497650027275,
300
+ "eval_loss_tr_tr": 0.7339828014373779,
301
+ "eval_loss_uk_ua": 4.67767858505249,
302
+ "eval_loss_umb_ao": 1.4020830392837524,
303
+ "eval_loss_ur_pk": 8.40671443939209,
304
+ "eval_loss_uz_uz": 4.329716682434082,
305
+ "eval_loss_vi_vn": 1.1303719282150269,
306
+ "eval_loss_wo_sn": 2.2281110286712646,
307
+ "eval_loss_xh_za": 0.0009458978893235326,
308
+ "eval_loss_yo_ng": 1.3345184326171875,
309
+ "eval_loss_yue_hant_hk": 1.072838306427002,
310
+ "eval_loss_zu_za": 3.7278547286987305,
311
+ "eval_runtime": 19.1831931372549,
312
+ "eval_samples_per_second": 41.44199019607843,
313
+ "eval_steps_per_second": 5.209764705882353,
314
+ "predict_samples": 77960,
315
  "train_loss": 5.854813561474184e-06,
316
+ "train_runtime": 568.9856,
317
  "train_samples": 246408,
318
+ "train_samples_per_second": 2165.327,
319
+ "train_steps_per_second": 33.841
320
  }
config.json CHANGED
@@ -307,7 +307,7 @@
307
  1,
308
  1
309
  ],
310
- "torch_dtype": "float32",
311
  "transformers_version": "4.18.0.dev0",
312
  "use_weighted_layer_sum": false,
313
  "vocab_size": 32,
307
  1,
308
  1
309
  ],
310
+ "torch_dtype": "float16",
311
  "transformers_version": "4.18.0.dev0",
312
  "use_weighted_layer_sum": false,
313
  "vocab_size": 32,
predict_results.json ADDED
@@ -0,0 +1,315 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.07,
3
+ "epoch_af_za": 4.07,
4
+ "epoch_am_et": 4.07,
5
+ "epoch_ar_eg": 4.07,
6
+ "epoch_as_in": 4.07,
7
+ "epoch_ast_es": 4.07,
8
+ "epoch_az_az": 4.07,
9
+ "epoch_be_by": 4.07,
10
+ "epoch_bn_in": 4.07,
11
+ "epoch_bs_ba": 4.07,
12
+ "epoch_ca_es": 4.07,
13
+ "epoch_ceb_ph": 4.07,
14
+ "epoch_cmn_hans_cn": 4.07,
15
+ "epoch_cs_cz": 4.07,
16
+ "epoch_cy_gb": 4.07,
17
+ "epoch_da_dk": 4.07,
18
+ "epoch_de_de": 4.07,
19
+ "epoch_el_gr": 4.07,
20
+ "epoch_en_us": 4.07,
21
+ "epoch_es_419": 4.07,
22
+ "epoch_et_ee": 4.07,
23
+ "epoch_fa_ir": 4.07,
24
+ "epoch_ff_sn": 4.07,
25
+ "epoch_fi_fi": 4.07,
26
+ "epoch_fil_ph": 4.07,
27
+ "epoch_fr_fr": 4.07,
28
+ "epoch_ga_ie": 4.07,
29
+ "epoch_gl_es": 4.07,
30
+ "epoch_gu_in": 4.07,
31
+ "epoch_ha_ng": 4.07,
32
+ "epoch_he_il": 4.07,
33
+ "epoch_hi_in": 4.07,
34
+ "epoch_hr_hr": 4.07,
35
+ "epoch_hu_hu": 4.07,
36
+ "epoch_hy_am": 4.07,
37
+ "epoch_id_id": 4.07,
38
+ "epoch_ig_ng": 4.07,
39
+ "epoch_is_is": 4.07,
40
+ "epoch_it_it": 4.07,
41
+ "epoch_ja_jp": 4.07,
42
+ "epoch_jv_id": 4.07,
43
+ "epoch_ka_ge": 4.07,
44
+ "epoch_kam_ke": 4.07,
45
+ "epoch_kea_cv": 4.07,
46
+ "epoch_kk_kz": 4.07,
47
+ "epoch_km_kh": 4.07,
48
+ "epoch_kn_in": 4.07,
49
+ "epoch_ko_kr": 4.07,
50
+ "epoch_ku_arab_iq": 4.07,
51
+ "epoch_ky_kg": 4.07,
52
+ "epoch_lb_lu": 4.07,
53
+ "epoch_lg_ug": 4.07,
54
+ "epoch_ln_cd": 4.07,
55
+ "epoch_lo_la": 4.07,
56
+ "epoch_lt_lt": 4.07,
57
+ "epoch_luo_ke": 4.07,
58
+ "epoch_lv_lv": 4.07,
59
+ "epoch_mi_nz": 4.07,
60
+ "epoch_mk_mk": 4.07,
61
+ "epoch_ml_in": 4.07,
62
+ "epoch_mn_mn": 4.07,
63
+ "epoch_mr_in": 4.07,
64
+ "epoch_ms_my": 4.07,
65
+ "epoch_mt_mt": 4.07,
66
+ "epoch_my_mm": 4.07,
67
+ "epoch_nb_no": 4.07,
68
+ "epoch_ne_np": 4.07,
69
+ "epoch_nl_nl": 4.07,
70
+ "epoch_nso_za": 4.07,
71
+ "epoch_ny_mw": 4.07,
72
+ "epoch_oci_fr": 4.07,
73
+ "epoch_om_et": 4.07,
74
+ "epoch_or_in": 4.07,
75
+ "epoch_pa_in": 4.07,
76
+ "epoch_pl_pl": 4.07,
77
+ "epoch_ps_af": 4.07,
78
+ "epoch_pt_br": 4.07,
79
+ "epoch_ro_ro": 4.07,
80
+ "epoch_ru_ru": 4.07,
81
+ "epoch_rup_bg": 4.07,
82
+ "epoch_sd_arab_in": 4.07,
83
+ "epoch_sk_sk": 4.07,
84
+ "epoch_sl_si": 4.07,
85
+ "epoch_sn_zw": 4.07,
86
+ "epoch_so_so": 4.07,
87
+ "epoch_sr_rs": 4.07,
88
+ "epoch_sv_se": 4.07,
89
+ "epoch_sw_ke": 4.07,
90
+ "epoch_ta_in": 4.07,
91
+ "epoch_te_in": 4.07,
92
+ "epoch_tg_tj": 4.07,
93
+ "epoch_th_th": 4.07,
94
+ "epoch_tr_tr": 4.07,
95
+ "epoch_uk_ua": 4.07,
96
+ "epoch_umb_ao": 4.07,
97
+ "epoch_ur_pk": 4.07,
98
+ "epoch_uz_uz": 4.07,
99
+ "epoch_vi_vn": 4.07,
100
+ "epoch_wo_sn": 4.07,
101
+ "epoch_xh_za": 4.07,
102
+ "epoch_yo_ng": 4.07,
103
+ "epoch_yue_hant_hk": 4.07,
104
+ "epoch_zu_za": 4.07,
105
+ "eval_accuracy": 0.7271468398716529,
106
+ "eval_accuracy_af_za": 0.3864734299516908,
107
+ "eval_accuracy_am_et": 0.8817829457364341,
108
+ "eval_accuracy_ar_eg": 0.9976635514018691,
109
+ "eval_accuracy_as_in": 0.9857723577235772,
110
+ "eval_accuracy_ast_es": 0.8361522198731501,
111
+ "eval_accuracy_az_az": 0.838569880823402,
112
+ "eval_accuracy_be_by": 0.40847983453981385,
113
+ "eval_accuracy_bn_in": 0.9989130434782608,
114
+ "eval_accuracy_bs_ba": 0.2508108108108108,
115
+ "eval_accuracy_ca_es": 0.6946808510638298,
116
+ "eval_accuracy_ceb_ph": 0.9852125693160814,
117
+ "eval_accuracy_cmn_hans_cn": 0.9798941798941799,
118
+ "eval_accuracy_cs_cz": 0.5352697095435685,
119
+ "eval_accuracy_cy_gb": 0.9715964740450539,
120
+ "eval_accuracy_da_dk": 0.6688172043010753,
121
+ "eval_accuracy_de_de": 0.7807424593967517,
122
+ "eval_accuracy_el_gr": 0.7692307692307693,
123
+ "eval_accuracy_en_us": 0.98145285935085,
124
+ "eval_accuracy_es_419": 0.9845814977973568,
125
+ "eval_accuracy_et_ee": 0.522956326987682,
126
+ "eval_accuracy_fa_ir": 0.8461538461538461,
127
+ "eval_accuracy_ff_sn": 0.23484848484848486,
128
+ "eval_accuracy_fi_fi": 0.9978213507625272,
129
+ "eval_accuracy_fil_ph": 0.9564315352697096,
130
+ "eval_accuracy_fr_fr": 0.985207100591716,
131
+ "eval_accuracy_ga_ie": 0.8467933491686461,
132
+ "eval_accuracy_gl_es": 0.5016181229773463,
133
+ "eval_accuracy_gu_in": 0.973,
134
+ "eval_accuracy_ha_ng": 0.9162640901771336,
135
+ "eval_accuracy_he_il": 0.8042929292929293,
136
+ "eval_accuracy_hi_in": 0.9354066985645934,
137
+ "eval_accuracy_hr_hr": 0.36542669584245074,
138
+ "eval_accuracy_hu_hu": 0.8044198895027624,
139
+ "eval_accuracy_hy_am": 0.9914163090128756,
140
+ "eval_accuracy_id_id": 0.9868995633187773,
141
+ "eval_accuracy_ig_ng": 0.936016511867905,
142
+ "eval_accuracy_is_is": 0.021739130434782608,
143
+ "eval_accuracy_it_it": 0.8,
144
+ "eval_accuracy_ja_jp": 0.7384615384615385,
145
+ "eval_accuracy_jv_id": 0.5824175824175825,
146
+ "eval_accuracy_ka_ge": 0.8610827374872319,
147
+ "eval_accuracy_kam_ke": 0.4183796856106409,
148
+ "eval_accuracy_kea_cv": 0.8692129629629629,
149
+ "eval_accuracy_kk_kz": 0.8726635514018691,
150
+ "eval_accuracy_km_kh": 0.7029831387808041,
151
+ "eval_accuracy_kn_in": 0.9630071599045346,
152
+ "eval_accuracy_ko_kr": 0.9842931937172775,
153
+ "eval_accuracy_ku_arab_iq": 0.9577006507592191,
154
+ "eval_accuracy_ky_kg": 0.8935516888433982,
155
+ "eval_accuracy_lb_lu": 0.8897216274089935,
156
+ "eval_accuracy_lg_ug": 0.9253112033195021,
157
+ "eval_accuracy_ln_cd": 0.9644351464435147,
158
+ "eval_accuracy_lo_la": 0.1580246913580247,
159
+ "eval_accuracy_lt_lt": 0.4685598377281947,
160
+ "eval_accuracy_luo_ke": 0.9921875,
161
+ "eval_accuracy_lv_lv": 0.6498237367802585,
162
+ "eval_accuracy_mi_nz": 0.9613095238095238,
163
+ "eval_accuracy_mk_mk": 0.763617677286742,
164
+ "eval_accuracy_ml_in": 0.6962421711899791,
165
+ "eval_accuracy_mn_mn": 0.8461538461538461,
166
+ "eval_accuracy_mr_in": 0.39113300492610836,
167
+ "eval_accuracy_ms_my": 0.36315086782376504,
168
+ "eval_accuracy_mt_mt": 0.6187904967602592,
169
+ "eval_accuracy_my_mm": 0.9704545454545455,
170
+ "eval_accuracy_nb_no": 0.6890756302521008,
171
+ "eval_accuracy_ne_np": 0.8994490358126722,
172
+ "eval_accuracy_nl_nl": 0.9093406593406593,
173
+ "eval_accuracy_nso_za": 0.8873417721518987,
174
+ "eval_accuracy_ny_mw": 0.469119579500657,
175
+ "eval_accuracy_oci_fr": 0.1533066132264529,
176
+ "eval_accuracy_om_et": 0.9512195121951219,
177
+ "eval_accuracy_or_in": 0.5447338618346546,
178
+ "eval_accuracy_pa_in": 0.8153310104529616,
179
+ "eval_accuracy_pl_pl": 0.7757255936675461,
180
+ "eval_accuracy_ps_af": 0.810546875,
181
+ "eval_accuracy_pt_br": 0.7714907508161044,
182
+ "eval_accuracy_ro_ro": 0.41223103057757643,
183
+ "eval_accuracy_ru_ru": 0.9793548387096774,
184
+ "eval_accuracy_rup_bg": 0.9468085106382979,
185
+ "eval_accuracy_sd_arab_in": 0.5244897959183673,
186
+ "eval_accuracy_sk_sk": 0.8623737373737373,
187
+ "eval_accuracy_sl_si": 0.02997601918465228,
188
+ "eval_accuracy_sn_zw": 0.8843243243243243,
189
+ "eval_accuracy_so_so": 0.8802747791952895,
190
+ "eval_accuracy_sr_rs": 0.025714285714285714,
191
+ "eval_accuracy_sv_se": 0.014492753623188406,
192
+ "eval_accuracy_sw_ke": 0.919917864476386,
193
+ "eval_accuracy_ta_in": 0.9526226734348562,
194
+ "eval_accuracy_te_in": 0.9788135593220338,
195
+ "eval_accuracy_tg_tj": 0.9883333333333333,
196
+ "eval_accuracy_th_th": 0.9911851126346719,
197
+ "eval_accuracy_tr_tr": 0.7886944818304172,
198
+ "eval_accuracy_uk_ua": 0.06266666666666666,
199
+ "eval_accuracy_umb_ao": 0.7862796833773087,
200
+ "eval_accuracy_ur_pk": 0.013377926421404682,
201
+ "eval_accuracy_uz_uz": 0.4013921113689095,
202
+ "eval_accuracy_vi_vn": 0.7246207701283547,
203
+ "eval_accuracy_wo_sn": 0.4555256064690027,
204
+ "eval_accuracy_xh_za": 1.0,
205
+ "eval_accuracy_yo_ng": 0.7352587244283996,
206
+ "eval_accuracy_yue_hant_hk": 0.7985347985347986,
207
+ "eval_accuracy_zu_za": 0.46955503512880564,
208
+ "eval_loss": 1.378929700578024,
209
+ "eval_loss_af_za": 2.6778101921081543,
210
+ "eval_loss_am_et": 0.46154311299324036,
211
+ "eval_loss_ar_eg": 0.014941702596843243,
212
+ "eval_loss_as_in": 0.07641631364822388,
213
+ "eval_loss_ast_es": 0.4559924304485321,
214
+ "eval_loss_az_az": 0.5676775574684143,
215
+ "eval_loss_be_by": 1.9230682849884033,
216
+ "eval_loss_bn_in": 0.002447569975629449,
217
+ "eval_loss_bs_ba": 2.4953715801239014,
218
+ "eval_loss_ca_es": 1.2631815671920776,
219
+ "eval_loss_ceb_ph": 0.04263082891702652,
220
+ "eval_loss_cmn_hans_cn": 0.06501840800046921,
221
+ "eval_loss_cs_cz": 1.9333536624908447,
222
+ "eval_loss_cy_gb": 0.1273733228445053,
223
+ "eval_loss_da_dk": 1.4990081787109375,
224
+ "eval_loss_de_de": 0.8820119500160217,
225
+ "eval_loss_el_gr": 0.9838642477989197,
226
+ "eval_loss_en_us": 0.08269134163856506,
227
+ "eval_loss_es_419": 0.05156087502837181,
228
+ "eval_loss_et_ee": 1.9264016151428223,
229
+ "eval_loss_fa_ir": 0.6519789695739746,
230
+ "eval_loss_ff_sn": 5.428281307220459,
231
+ "eval_loss_fi_fi": 0.010886545293033123,
232
+ "eval_loss_fil_ph": 0.17060022056102753,
233
+ "eval_loss_fr_fr": 0.0590590201318264,
234
+ "eval_loss_ga_ie": 0.5173550248146057,
235
+ "eval_loss_gl_es": 1.2657122611999512,
236
+ "eval_loss_gu_in": 0.08499378710985184,
237
+ "eval_loss_ha_ng": 0.3233623802661896,
238
+ "eval_loss_he_il": 0.8299161195755005,
239
+ "eval_loss_hi_in": 0.4189773201942444,
240
+ "eval_loss_hr_hr": 2.9754278659820557,
241
+ "eval_loss_hu_hu": 0.8344607949256897,
242
+ "eval_loss_hy_am": 0.03288033604621887,
243
+ "eval_loss_id_id": 0.05292920395731926,
244
+ "eval_loss_ig_ng": 0.25233691930770874,
245
+ "eval_loss_is_is": 6.5153117179870605,
246
+ "eval_loss_it_it": 0.8113388419151306,
247
+ "eval_loss_ja_jp": 1.396775245666504,
248
+ "eval_loss_jv_id": 2.0009281635284424,
249
+ "eval_loss_ka_ge": 0.6161583065986633,
250
+ "eval_loss_kam_ke": 2.219219446182251,
251
+ "eval_loss_kea_cv": 0.5567307472229004,
252
+ "eval_loss_kk_kz": 0.5592476725578308,
253
+ "eval_loss_km_kh": 1.7357780933380127,
254
+ "eval_loss_kn_in": 0.10634830594062805,
255
+ "eval_loss_ko_kr": 0.151944100856781,
256
+ "eval_loss_ku_arab_iq": 0.2075168490409851,
257
+ "eval_loss_ky_kg": 0.46389031410217285,
258
+ "eval_loss_lb_lu": 0.44538378715515137,
259
+ "eval_loss_lg_ug": 0.37638625502586365,
260
+ "eval_loss_ln_cd": 0.18439875543117523,
261
+ "eval_loss_lo_la": 3.805140495300293,
262
+ "eval_loss_lt_lt": 2.5053646564483643,
263
+ "eval_loss_luo_ke": 0.047887783497571945,
264
+ "eval_loss_lv_lv": 1.3713427782058716,
265
+ "eval_loss_mi_nz": 0.13896487653255463,
266
+ "eval_loss_mk_mk": 0.7952373027801514,
267
+ "eval_loss_ml_in": 1.2999218702316284,
268
+ "eval_loss_mn_mn": 0.7620733976364136,
269
+ "eval_loss_mr_in": 3.705583095550537,
270
+ "eval_loss_ms_my": 3.0192301273345947,
271
+ "eval_loss_mt_mt": 1.5519871711730957,
272
+ "eval_loss_my_mm": 0.15139135718345642,
273
+ "eval_loss_nb_no": 1.1194071769714355,
274
+ "eval_loss_ne_np": 0.4230792224407196,
275
+ "eval_loss_nl_nl": 0.3290546238422394,
276
+ "eval_loss_nso_za": 0.510554313659668,
277
+ "eval_loss_ny_mw": 2.734614610671997,
278
+ "eval_loss_oci_fr": 5.098300933837891,
279
+ "eval_loss_om_et": 0.2296750545501709,
280
+ "eval_loss_or_in": 2.543181896209717,
281
+ "eval_loss_pa_in": 0.7753236293792725,
282
+ "eval_loss_pl_pl": 0.7309491634368896,
283
+ "eval_loss_ps_af": 1.0454343557357788,
284
+ "eval_loss_pt_br": 0.9782202243804932,
285
+ "eval_loss_ro_ro": 3.5829010009765625,
286
+ "eval_loss_ru_ru": 0.059757012873888016,
287
+ "eval_loss_rup_bg": 0.1694687306880951,
288
+ "eval_loss_sd_arab_in": 2.619832992553711,
289
+ "eval_loss_sk_sk": 0.5583317875862122,
290
+ "eval_loss_sl_si": 6.092343807220459,
291
+ "eval_loss_sn_zw": 0.44645825028419495,
292
+ "eval_loss_so_so": 0.4492073059082031,
293
+ "eval_loss_sr_rs": 4.757461071014404,
294
+ "eval_loss_sv_se": 6.585770130157471,
295
+ "eval_loss_sw_ke": 0.42353829741477966,
296
+ "eval_loss_ta_in": 0.18184617161750793,
297
+ "eval_loss_te_in": 0.08084087073802948,
298
+ "eval_loss_tg_tj": 0.0912216454744339,
299
+ "eval_loss_th_th": 0.04623497650027275,
300
+ "eval_loss_tr_tr": 0.7339828014373779,
301
+ "eval_loss_uk_ua": 4.67767858505249,
302
+ "eval_loss_umb_ao": 1.4020830392837524,
303
+ "eval_loss_ur_pk": 8.40671443939209,
304
+ "eval_loss_uz_uz": 4.329716682434082,
305
+ "eval_loss_vi_vn": 1.1303719282150269,
306
+ "eval_loss_wo_sn": 2.2281110286712646,
307
+ "eval_loss_xh_za": 0.0009458978893235326,
308
+ "eval_loss_yo_ng": 1.3345184326171875,
309
+ "eval_loss_yue_hant_hk": 1.072838306427002,
310
+ "eval_loss_zu_za": 3.7278547286987305,
311
+ "eval_runtime": 19.1831931372549,
312
+ "eval_samples_per_second": 41.44199019607843,
313
+ "eval_steps_per_second": 5.209764705882353,
314
+ "predict_samples": 77960
315
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8029c9175dccf3727ed80f0134cd1d993b75fd2c92abfe5d7c72caefc9b0344
3
- size 1263081325
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99336c858dfd8285c2f2c2d77a5ceff4d9f366a8ecb36ed5306946926dda1332
3
+ size 631626669
runs/Apr12_18-17-31_anton-xtreme-s/events.out.tfevents.1649788105.anton-xtreme-s.23063.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a42be21ca793d5d6279626701a8e99ef22e0229da5061ecad85267971e16269
3
+ size 51529
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.07,
3
  "train_loss": 5.854813561474184e-06,
4
- "train_runtime": 574.8329,
5
  "train_samples": 246408,
6
- "train_samples_per_second": 2143.301,
7
- "train_steps_per_second": 33.497
8
  }
1
  {
2
  "epoch": 4.07,
3
  "train_loss": 5.854813561474184e-06,
4
+ "train_runtime": 568.9856,
5
  "train_samples": 246408,
6
+ "train_samples_per_second": 2165.327,
7
+ "train_steps_per_second": 33.841
8
  }
trainer_state.json CHANGED
@@ -115713,9 +115713,9 @@
115713
  "step": 19255,
115714
  "total_flos": 4.709738606122584e+20,
115715
  "train_loss": 5.854813561474184e-06,
115716
- "train_runtime": 574.8329,
115717
- "train_samples_per_second": 2143.301,
115718
- "train_steps_per_second": 33.497
115719
  }
115720
  ],
115721
  "max_steps": 19255,
115713
  "step": 19255,
115714
  "total_flos": 4.709738606122584e+20,
115715
  "train_loss": 5.854813561474184e-06,
115716
+ "train_runtime": 568.9856,
115717
+ "train_samples_per_second": 2165.327,
115718
+ "train_steps_per_second": 33.841
115719
  }
115720
  ],
115721
  "max_steps": 19255,