diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,6009 @@ +{ + "best_metric": 50.9114, + "best_model_checkpoint": "/output/checkpoint-10000", + "epoch": 2.0, + "global_step": 15062, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0, + "loss": 11.2617, + "step": 1 + }, + { + "epoch": 0.0, + "eval_exact_match": 0.0, + "eval_exact_match_for_answerability_classification": 0.0, + "eval_exact_match_for_cause_effect_classification": 0.0, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 0.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 0.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 0.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 0.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 0.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 0.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 0.0, + "eval_exact_match_for_textual_entailment": 0.0, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 4.2644, + "eval_f1_for_answerability_classification": 1.8668, + "eval_f1_for_cause_effect_classification": 4.344, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 3.471, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 3.1606, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 3.6846, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 3.2959, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 2.4751, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 3.3739, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 2.7326, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 3.4745, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 3.1997, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 3.2799, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 5.1837, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 4.1242, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 3.8632, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 4.7895, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 3.4823, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 3.3336, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 2.0693, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 5.1318, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 4.1919, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 13.1647, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 2.3551, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 4.0293, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 2.7788, + "eval_f1_for_task396_persianqa_answerability_classification": 1.8668, + "eval_f1_for_task463_pasinlu_textual_entailment": 2.4353, + "eval_f1_for_task464_pasinlu_textual_entailment": 8.3545, + "eval_f1_for_task534_farstail_textual_entailment": 2.0874, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 6.9245, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 4.611, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 7.979, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 5.4811, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 6.9087, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 3.1593, + "eval_f1_for_task968_xcopa_cause_effect_classification": 4.2922, + "eval_f1_for_task969_xcopa_cause_effect_classification": 4.51, + "eval_f1_for_textual_entailment": 4.2924, + "eval_f1_for_title_generation": 4.1919, + "eval_gen_len": 111.9417, + "eval_global_step": 1, + "eval_loss": 14.192606925964355, + "eval_rouge1": 3.1222, + "eval_rouge1_for_answerability_classification": 2.0936, + "eval_rouge1_for_cause_effect_classification": 3.418, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 2.9198, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 2.1195, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 4.1343, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 2.2827, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 3.0535, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 2.5602, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 2.6335, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 2.631, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 3.7264, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 2.7074, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 4.5135, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 2.6166, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 3.5439, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 3.159, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 2.7565, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 2.2842, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 3.4868, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 3.3792, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 0.36, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 10.5917, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 1.8427, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 3.6141, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 2.0352, + "eval_rouge1_for_task396_persianqa_answerability_classification": 2.0936, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 2.3758, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 0.0491, + "eval_rouge1_for_task534_farstail_textual_entailment": 1.8557, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 3.5991, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 3.9341, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 4.1945, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 4.8076, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 4.1962, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 2.1487, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 4.0485, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 3.0208, + "eval_rouge1_for_textual_entailment": 1.4269, + "eval_rouge1_for_title_generation": 0.36, + "eval_rougeL": 3.1178, + "eval_rougeL_for_answerability_classification": 2.0936, + "eval_rougeL_for_cause_effect_classification": 3.413, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 2.9198, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 2.1195, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 4.1343, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 2.2827, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 3.0535, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 2.5602, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 2.6335, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 2.631, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 3.7264, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 2.7074, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 4.5135, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 2.6166, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 3.5439, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 3.159, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 2.7565, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 2.2842, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 3.4868, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 3.3792, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 0.36, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 10.474, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 1.8427, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 3.5796, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 2.0352, + "eval_rougeL_for_task396_persianqa_answerability_classification": 2.0936, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 2.3758, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 0.0491, + "eval_rougeL_for_task534_farstail_textual_entailment": 1.8557, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 3.5991, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 3.9341, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 4.1945, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 4.8076, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 4.1962, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 2.1487, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 4.0485, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 3.0208, + "eval_rougeL_for_textual_entailment": 1.4269, + "eval_rougeL_for_title_generation": 0.36, + "eval_runtime": 410.3185, + "eval_samples_per_second": 8.53, + "eval_steps_per_second": 0.134, + "step": 1 + }, + { + "epoch": 0.01, + "learning_rate": 5e-05, + "loss": 4.395, + "step": 50 + }, + { + "epoch": 0.01, + "eval_exact_match": 41.4857, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 44.5, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 20.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 5.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 0.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_textual_entailment": 22.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 44.8407, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 47.9961, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 8.2131, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 28.7008, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 15.5144, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 5.3294, + "eval_f1_for_task534_farstail_textual_entailment": 33.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 27.3333, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 33.3333, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_textual_entailment": 23.7765, + "eval_f1_for_title_generation": 8.2131, + "eval_gen_len": 2.8286, + "eval_global_step": 50, + "eval_loss": 0.9278950691223145, + "eval_rouge1": 44.6676, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 48.1566, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 1.6667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 28.4918, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 15.2061, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 41.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_textual_entailment": 22.3333, + "eval_rouge1_for_title_generation": 1.6667, + "eval_rougeL": 44.6676, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 48.1566, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 1.6667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 28.4918, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 15.2061, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 41.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_textual_entailment": 22.3333, + "eval_rougeL_for_title_generation": 1.6667, + "eval_runtime": 52.7494, + "eval_samples_per_second": 66.351, + "eval_steps_per_second": 1.043, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 5e-05, + "loss": 2.0981, + "step": 100 + }, + { + "epoch": 0.01, + "eval_exact_match": 46.2571, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 50.1, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 32.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 32.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 21.3333, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 50.3202, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 53.9093, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 11.4378, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.7794, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.9984, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 32.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 18.4906, + "eval_f1_for_task534_farstail_textual_entailment": 32.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 27.4969, + "eval_f1_for_title_generation": 11.4378, + "eval_gen_len": 3.4271, + "eval_global_step": 100, + "eval_loss": 0.5112689733505249, + "eval_rouge1": 47.4081, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 51.3773, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 2.9667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.0879, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.2301, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 32.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 32.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 21.6667, + "eval_rouge1_for_title_generation": 2.9667, + "eval_rougeL": 47.4034, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 51.3717, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 2.9667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.0879, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.0634, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 32.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 32.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 21.6667, + "eval_rougeL_for_title_generation": 2.9667, + "eval_runtime": 49.8187, + "eval_samples_per_second": 70.255, + "eval_steps_per_second": 1.104, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 5e-05, + "loss": 1.903, + "step": 200 + }, + { + "epoch": 0.03, + "eval_exact_match": 45.3714, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 49.0333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 18.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 31.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 21.6667, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 49.5606, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 52.8281, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 9.8754, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 71.8608, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 37.9808, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 24.903, + "eval_f1_for_task534_farstail_textual_entailment": 31.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 29.9677, + "eval_f1_for_title_generation": 9.8754, + "eval_gen_len": 3.4326, + "eval_global_step": 200, + "eval_loss": 0.4994029104709625, + "eval_rouge1": 46.5531, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 50.3136, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 3.45, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 71.5543, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.8534, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 31.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 22.1667, + "eval_rouge1_for_title_generation": 3.45, + "eval_rougeL": 46.5374, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 50.3036, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 3.2, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 71.5543, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.5534, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 31.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 22.1667, + "eval_rougeL_for_title_generation": 3.2, + "eval_runtime": 47.216, + "eval_samples_per_second": 74.127, + "eval_steps_per_second": 1.165, + "step": 200 + }, + { + "epoch": 0.07, + "learning_rate": 5e-05, + "loss": 1.7406, + "step": 500 + }, + { + "epoch": 0.07, + "eval_exact_match": 45.6286, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 49.2667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 58.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 22.6667, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 49.876, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 52.8919, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 16.1737, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 73.2462, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.5102, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 25.7294, + "eval_f1_for_task534_farstail_textual_entailment": 34.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 30.9098, + "eval_f1_for_title_generation": 16.1737, + "eval_gen_len": 4.2251, + "eval_global_step": 500, + "eval_loss": 0.4882946312427521, + "eval_rouge1": 46.7309, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 50.3514, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.3726, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 72.734, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.8093, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.6667, + "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 22.8889, + "eval_rouge1_for_title_generation": 6.3726, + "eval_rougeL": 46.7252, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 50.3448, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.3726, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 72.734, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.6093, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.6667, + "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 22.8889, + "eval_rougeL_for_title_generation": 6.3726, + "eval_runtime": 51.2553, + "eval_samples_per_second": 68.286, + "eval_steps_per_second": 1.073, + "step": 500 + }, + { + "epoch": 0.13, + "learning_rate": 5e-05, + "loss": 1.5969, + "step": 1000 + }, + { + "epoch": 0.13, + "eval_exact_match": 44.4286, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 47.9333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 45.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 41.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 46.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 47.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 45.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 17.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 44.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 22.3333, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 48.7078, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 51.5153, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 45.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 41.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 46.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 47.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 16.7735, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 61.5139, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 32.9466, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 25.54, + "eval_f1_for_task534_farstail_textual_entailment": 34.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 44.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 30.8467, + "eval_f1_for_title_generation": 16.7735, + "eval_gen_len": 4.3826, + "eval_global_step": 1000, + "eval_loss": 0.47427454590797424, + "eval_rouge1": 45.5347, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 48.9838, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 45.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 41.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 46.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 47.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.7, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 61.3384, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 32.1749, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 44.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 22.8333, + "eval_rouge1_for_title_generation": 5.7, + "eval_rougeL": 45.5246, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 48.972, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 45.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 41.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 46.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 47.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.7, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 61.1846, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 31.9749, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 44.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 22.8333, + "eval_rougeL_for_title_generation": 5.7, + "eval_runtime": 60.9063, + "eval_samples_per_second": 57.465, + "eval_steps_per_second": 0.903, + "step": 1000 + }, + { + "epoch": 0.2, + "learning_rate": 5e-05, + "loss": 1.4937, + "step": 1500 + }, + { + "epoch": 0.2, + "eval_exact_match": 45.6571, + "eval_exact_match_for_answerability_classification": 49.0, + "eval_exact_match_for_cause_effect_classification": 49.3667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 44.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 42.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 40.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 46.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 33.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 48.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 49.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 22.3333, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 49.9636, + "eval_f1_for_answerability_classification": 49.0, + "eval_f1_for_cause_effect_classification": 52.7891, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 44.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 42.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 40.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 46.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.431, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.8772, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 47.7961, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 48.0, + "eval_f1_for_task396_persianqa_answerability_classification": 49.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.6215, + "eval_f1_for_task534_farstail_textual_entailment": 33.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 77.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 31.2072, + "eval_f1_for_title_generation": 22.431, + "eval_gen_len": 4.6006, + "eval_global_step": 1500, + "eval_loss": 0.4453420639038086, + "eval_rouge1": 46.7181, + "eval_rouge1_for_answerability_classification": 49.0, + "eval_rouge1_for_cause_effect_classification": 50.3361, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 44.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 42.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 40.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 46.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.5492, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.6298, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 47.4533, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 48.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 49.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 22.8333, + "eval_rouge1_for_title_generation": 7.5492, + "eval_rougeL": 46.7052, + "eval_rougeL_for_answerability_classification": 49.0, + "eval_rougeL_for_cause_effect_classification": 50.3294, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 44.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 42.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 40.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 46.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.2992, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.6298, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 47.2533, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 48.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 49.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 22.8333, + "eval_rougeL_for_title_generation": 7.2992, + "eval_runtime": 54.9496, + "eval_samples_per_second": 63.695, + "eval_steps_per_second": 1.001, + "step": 1500 + }, + { + "epoch": 0.27, + "learning_rate": 5e-05, + "loss": 1.4808, + "step": 2000 + }, + { + "epoch": 0.27, + "eval_exact_match": 46.4857, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 50.2333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 46.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 43.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 44.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 35.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_textual_entailment": 23.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 50.859, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 53.7262, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 46.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 43.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 44.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.6628, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.642, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 36.1429, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 35.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.6186, + "eval_f1_for_task534_farstail_textual_entailment": 33.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_textual_entailment": 31.8729, + "eval_f1_for_title_generation": 22.6628, + "eval_gen_len": 4.3834, + "eval_global_step": 2000, + "eval_loss": 0.4502388536930084, + "eval_rouge1": 47.5331, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 51.2125, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 46.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 43.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 44.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.7827, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.4834, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.8921, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 35.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_textual_entailment": 23.1667, + "eval_rouge1_for_title_generation": 7.7827, + "eval_rougeL": 47.5274, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 51.2059, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 46.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 43.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 44.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.7827, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.4834, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.6921, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 35.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_textual_entailment": 23.1667, + "eval_rougeL_for_title_generation": 7.7827, + "eval_runtime": 56.4908, + "eval_samples_per_second": 61.957, + "eval_steps_per_second": 0.974, + "step": 2000 + }, + { + "epoch": 0.33, + "learning_rate": 5e-05, + "loss": 1.4142, + "step": 2500 + }, + { + "epoch": 0.33, + "eval_exact_match": 45.9143, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 49.5667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_textual_entailment": 22.6667, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 49.9839, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 53.1953, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 11.6421, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.4947, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 37.3657, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 24.9355, + "eval_f1_for_task534_farstail_textual_entailment": 34.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_textual_entailment": 30.6452, + "eval_f1_for_title_generation": 11.6421, + "eval_gen_len": 3.8066, + "eval_global_step": 2500, + "eval_loss": 0.4557723104953766, + "eval_rouge1": 46.8499, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 50.6725, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 1.5714, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.4087, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 36.7677, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_textual_entailment": 22.6667, + "eval_rouge1_for_title_generation": 1.5714, + "eval_rougeL": 46.8385, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 50.6592, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 1.5714, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.2087, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 36.5677, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_textual_entailment": 22.6667, + "eval_rougeL_for_title_generation": 1.5714, + "eval_runtime": 52.9945, + "eval_samples_per_second": 66.045, + "eval_steps_per_second": 1.038, + "step": 2500 + }, + { + "epoch": 0.4, + "learning_rate": 5e-05, + "loss": 1.424, + "step": 3000 + }, + { + "epoch": 0.4, + "eval_exact_match": 45.2571, + "eval_exact_match_for_answerability_classification": 48.0, + "eval_exact_match_for_cause_effect_classification": 49.8, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 47.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 45.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 48.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 6.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 48.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_textual_entailment": 13.6667, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 49.544, + "eval_f1_for_answerability_classification": 48.0, + "eval_f1_for_cause_effect_classification": 53.3133, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 47.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 45.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 20.0148, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3859, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.012, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 51.0, + "eval_f1_for_task396_persianqa_answerability_classification": 48.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.628, + "eval_f1_for_task534_farstail_textual_entailment": 6.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 48.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_textual_entailment": 22.2093, + "eval_f1_for_title_generation": 20.0148, + "eval_gen_len": 4.2606, + "eval_global_step": 3000, + "eval_loss": 0.49717187881469727, + "eval_rouge1": 46.25, + "eval_rouge1_for_answerability_classification": 48.0, + "eval_rouge1_for_cause_effect_classification": 50.7961, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 47.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 45.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.8667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.3101, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.5737, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 51.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 48.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 6.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 48.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_textual_entailment": 13.6667, + "eval_rouge1_for_title_generation": 5.8667, + "eval_rougeL": 46.25, + "eval_rougeL_for_answerability_classification": 48.0, + "eval_rougeL_for_cause_effect_classification": 50.7961, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 47.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 45.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.8667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.3101, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.5737, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 51.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 48.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 6.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 48.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_textual_entailment": 13.6667, + "eval_rougeL_for_title_generation": 5.8667, + "eval_runtime": 51.2339, + "eval_samples_per_second": 68.314, + "eval_steps_per_second": 1.074, + "step": 3000 + }, + { + "epoch": 0.46, + "learning_rate": 5e-05, + "loss": 1.3657, + "step": 3500 + }, + { + "epoch": 0.46, + "eval_exact_match": 46.0, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 49.4333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 49.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 39.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 47.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 25.0, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 50.4343, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 53.0825, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.5353, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.5879, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.8877, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 39.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.1911, + "eval_f1_for_task534_farstail_textual_entailment": 35.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 73.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 33.397, + "eval_f1_for_title_generation": 22.5353, + "eval_gen_len": 4.2649, + "eval_global_step": 3500, + "eval_loss": 0.4972946345806122, + "eval_rouge1": 47.073, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 50.493, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.7667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.3856, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.4042, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 39.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 47.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 25.0, + "eval_rouge1_for_title_generation": 7.7667, + "eval_rougeL": 47.0673, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 50.4863, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.7667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.3856, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.2042, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 39.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 47.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 25.0, + "eval_rougeL_for_title_generation": 7.7667, + "eval_runtime": 50.353, + "eval_samples_per_second": 69.509, + "eval_steps_per_second": 1.092, + "step": 3500 + }, + { + "epoch": 0.53, + "learning_rate": 5e-05, + "loss": 1.3591, + "step": 4000 + }, + { + "epoch": 0.53, + "eval_exact_match": 45.0, + "eval_exact_match_for_answerability_classification": 53.0, + "eval_exact_match_for_cause_effect_classification": 49.5333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 53.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 0.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_textual_entailment": 11.6667, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 49.2805, + "eval_f1_for_answerability_classification": 53.0, + "eval_f1_for_cause_effect_classification": 53.0349, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 19.2178, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.9583, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 43.5893, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task396_persianqa_answerability_classification": 53.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.551, + "eval_f1_for_task534_farstail_textual_entailment": 0.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 77.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_textual_entailment": 20.517, + "eval_f1_for_title_generation": 19.2178, + "eval_gen_len": 4.3746, + "eval_global_step": 4000, + "eval_loss": 0.5541166067123413, + "eval_rouge1": 46.1285, + "eval_rouge1_for_answerability_classification": 53.0, + "eval_rouge1_for_cause_effect_classification": 50.6331, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.5048, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.8166, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.1766, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 53.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 0.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_textual_entailment": 11.6667, + "eval_rouge1_for_title_generation": 7.5048, + "eval_rougeL": 46.1228, + "eval_rougeL_for_answerability_classification": 53.0, + "eval_rougeL_for_cause_effect_classification": 50.6264, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.5048, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.8166, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.9766, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 53.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 0.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_textual_entailment": 11.6667, + "eval_rougeL_for_title_generation": 7.5048, + "eval_runtime": 56.9164, + "eval_samples_per_second": 61.494, + "eval_steps_per_second": 0.966, + "step": 4000 + }, + { + "epoch": 0.6, + "learning_rate": 5e-05, + "loss": 1.334, + "step": 4500 + }, + { + "epoch": 0.6, + "eval_exact_match": 48.1429, + "eval_exact_match_for_answerability_classification": 68.0, + "eval_exact_match_for_cause_effect_classification": 51.4667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 68.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 37.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_textual_entailment": 24.3333, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 52.5952, + "eval_f1_for_answerability_classification": 68.0, + "eval_f1_for_cause_effect_classification": 55.0366, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.4279, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 73.2258, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 35.8708, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task396_persianqa_answerability_classification": 68.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 37.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.3083, + "eval_f1_for_task534_farstail_textual_entailment": 35.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_textual_entailment": 32.7694, + "eval_f1_for_title_generation": 23.4279, + "eval_gen_len": 4.2037, + "eval_global_step": 4500, + "eval_loss": 0.44648101925849915, + "eval_rouge1": 49.2638, + "eval_rouge1_for_answerability_classification": 68.0, + "eval_rouge1_for_cause_effect_classification": 52.5205, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.95, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 73.343, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.2724, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 68.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 37.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.6667, + "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_textual_entailment": 24.5556, + "eval_rouge1_for_title_generation": 6.95, + "eval_rougeL": 49.2509, + "eval_rougeL_for_answerability_classification": 68.0, + "eval_rougeL_for_cause_effect_classification": 52.5138, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.7, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 73.343, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.0724, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 68.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 37.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.6667, + "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_textual_entailment": 24.5556, + "eval_rougeL_for_title_generation": 6.7, + "eval_runtime": 56.8208, + "eval_samples_per_second": 61.597, + "eval_steps_per_second": 0.968, + "step": 4500 + }, + { + "epoch": 0.66, + "learning_rate": 5e-05, + "loss": 1.3219, + "step": 5000 + }, + { + "epoch": 0.66, + "eval_exact_match": 45.7143, + "eval_exact_match_for_answerability_classification": 50.0, + "eval_exact_match_for_cause_effect_classification": 49.6667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 31.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 27.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_textual_entailment": 19.6667, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 50.1301, + "eval_f1_for_answerability_classification": 50.0, + "eval_f1_for_cause_effect_classification": 53.2505, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.1179, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.5094, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 36.0067, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task396_persianqa_answerability_classification": 50.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 31.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.9195, + "eval_f1_for_task534_farstail_textual_entailment": 27.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_textual_entailment": 28.6398, + "eval_f1_for_title_generation": 21.1179, + "eval_gen_len": 4.4071, + "eval_global_step": 5000, + "eval_loss": 0.5046093463897705, + "eval_rouge1": 46.8082, + "eval_rouge1_for_answerability_classification": 50.0, + "eval_rouge1_for_cause_effect_classification": 50.7351, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.7333, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.4986, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.5551, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 31.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 27.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_textual_entailment": 19.8333, + "eval_rouge1_for_title_generation": 6.7333, + "eval_rougeL": 46.8025, + "eval_rougeL_for_answerability_classification": 50.0, + "eval_rougeL_for_cause_effect_classification": 50.7285, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.7333, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.2986, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.5551, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 31.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 27.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_textual_entailment": 19.8333, + "eval_rougeL_for_title_generation": 6.7333, + "eval_runtime": 52.9633, + "eval_samples_per_second": 66.084, + "eval_steps_per_second": 1.038, + "step": 5000 + }, + { + "epoch": 0.73, + "learning_rate": 5e-05, + "loss": 1.2949, + "step": 5500 + }, + { + "epoch": 0.73, + "eval_exact_match": 47.8, + "eval_exact_match_for_answerability_classification": 57.0, + "eval_exact_match_for_cause_effect_classification": 51.2333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 49.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 32.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 45.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_textual_entailment": 26.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 52.1079, + "eval_f1_for_answerability_classification": 57.0, + "eval_f1_for_cause_effect_classification": 54.6733, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.96, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.4703, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.7293, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_f1_for_task396_persianqa_answerability_classification": 57.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 32.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.6166, + "eval_f1_for_task534_farstail_textual_entailment": 45.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_textual_entailment": 34.8722, + "eval_f1_for_title_generation": 21.96, + "eval_gen_len": 4.344, + "eval_global_step": 5500, + "eval_loss": 0.5085814595222473, + "eval_rouge1": 48.773, + "eval_rouge1_for_answerability_classification": 57.0, + "eval_rouge1_for_cause_effect_classification": 52.1813, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.6167, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.3426, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.0955, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 32.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 45.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_textual_entailment": 26.0, + "eval_rouge1_for_title_generation": 6.6167, + "eval_rougeL": 48.773, + "eval_rougeL_for_answerability_classification": 57.0, + "eval_rougeL_for_cause_effect_classification": 52.1813, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 65.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.6167, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.3426, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.0955, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 32.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 45.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_textual_entailment": 26.0, + "eval_rougeL_for_title_generation": 6.6167, + "eval_runtime": 54.0521, + "eval_samples_per_second": 64.752, + "eval_steps_per_second": 1.018, + "step": 5500 + }, + { + "epoch": 0.8, + "learning_rate": 5e-05, + "loss": 1.3032, + "step": 6000 + }, + { + "epoch": 0.8, + "eval_exact_match": 48.0286, + "eval_exact_match_for_answerability_classification": 52.0, + "eval_exact_match_for_cause_effect_classification": 51.6667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 66.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 46.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 17.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 52.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_textual_entailment": 26.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 52.5448, + "eval_f1_for_answerability_classification": 52.0, + "eval_f1_for_cause_effect_classification": 55.2346, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 66.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.2404, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.1301, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 46.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 34.407, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_f1_for_task396_persianqa_answerability_classification": 52.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.7902, + "eval_f1_for_task534_farstail_textual_entailment": 35.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 79.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_textual_entailment": 34.9301, + "eval_f1_for_title_generation": 25.2404, + "eval_gen_len": 4.1863, + "eval_global_step": 6000, + "eval_loss": 0.49761494994163513, + "eval_rouge1": 49.2271, + "eval_rouge1_for_answerability_classification": 52.0, + "eval_rouge1_for_cause_effect_classification": 52.829, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 66.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.0778, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.6839, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 46.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 34.1859, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 52.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_textual_entailment": 26.3333, + "eval_rouge1_for_title_generation": 7.0778, + "eval_rougeL": 49.2156, + "eval_rougeL_for_answerability_classification": 52.0, + "eval_rougeL_for_cause_effect_classification": 52.8157, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 66.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.0778, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.4839, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 46.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 33.9859, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 55.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 52.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_textual_entailment": 26.3333, + "eval_rougeL_for_title_generation": 7.0778, + "eval_runtime": 48.9982, + "eval_samples_per_second": 71.431, + "eval_steps_per_second": 1.122, + "step": 6000 + }, + { + "epoch": 0.86, + "learning_rate": 5e-05, + "loss": 1.3026, + "step": 6500 + }, + { + "epoch": 0.86, + "eval_exact_match": 47.2857, + "eval_exact_match_for_answerability_classification": 63.0, + "eval_exact_match_for_cause_effect_classification": 50.2333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 23.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 63.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 48.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_textual_entailment": 27.6667, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 51.8128, + "eval_f1_for_answerability_classification": 63.0, + "eval_f1_for_cause_effect_classification": 53.8076, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 26.241, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.4594, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.7673, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task396_persianqa_answerability_classification": 63.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 48.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.9787, + "eval_f1_for_task534_farstail_textual_entailment": 34.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 49.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_textual_entailment": 36.6596, + "eval_f1_for_title_generation": 26.241, + "eval_gen_len": 4.2337, + "eval_global_step": 6500, + "eval_loss": 0.4878259003162384, + "eval_rouge1": 48.4413, + "eval_rouge1_for_answerability_classification": 63.0, + "eval_rouge1_for_cause_effect_classification": 51.2755, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.1803, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.0246, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 38.2396, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 63.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 48.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_textual_entailment": 28.0, + "eval_rouge1_for_title_generation": 10.1803, + "eval_rougeL": 48.4084, + "eval_rougeL_for_answerability_classification": 63.0, + "eval_rougeL_for_cause_effect_classification": 51.2621, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.4303, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.8246, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 38.0396, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 63.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 48.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_textual_entailment": 28.0, + "eval_rougeL_for_title_generation": 9.4303, + "eval_runtime": 55.9532, + "eval_samples_per_second": 62.552, + "eval_steps_per_second": 0.983, + "step": 6500 + }, + { + "epoch": 0.93, + "learning_rate": 5e-05, + "loss": 1.3001, + "step": 7000 + }, + { + "epoch": 0.93, + "eval_exact_match": 48.4, + "eval_exact_match_for_answerability_classification": 59.0, + "eval_exact_match_for_cause_effect_classification": 52.1333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 28.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 59.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_textual_entailment": 22.6667, + "eval_exact_match_for_title_generation": 3.0, + "eval_f1": 52.9111, + "eval_f1_for_answerability_classification": 59.0, + "eval_f1_for_cause_effect_classification": 55.7378, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.1245, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 71.3489, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 43.7847, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_f1_for_task396_persianqa_answerability_classification": 59.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 28.6292, + "eval_f1_for_task534_farstail_textual_entailment": 33.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_textual_entailment": 31.8764, + "eval_f1_for_title_generation": 25.1245, + "eval_gen_len": 4.2043, + "eval_global_step": 7000, + "eval_loss": 0.502213180065155, + "eval_rouge1": 49.4586, + "eval_rouge1_for_answerability_classification": 59.0, + "eval_rouge1_for_cause_effect_classification": 53.215, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.6, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 71.0823, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.367, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 59.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_textual_entailment": 22.6667, + "eval_rouge1_for_title_generation": 7.6, + "eval_rougeL": 49.4471, + "eval_rougeL_for_answerability_classification": 59.0, + "eval_rougeL_for_cause_effect_classification": 53.2016, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.6, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.8823, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 43.167, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 59.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_textual_entailment": 22.6667, + "eval_rougeL_for_title_generation": 7.6, + "eval_runtime": 52.3007, + "eval_samples_per_second": 66.921, + "eval_steps_per_second": 1.052, + "step": 7000 + }, + { + "epoch": 1.0, + "learning_rate": 5e-05, + "loss": 1.2703, + "step": 7500 + }, + { + "epoch": 1.0, + "eval_exact_match": 45.5429, + "eval_exact_match_for_answerability_classification": 57.0, + "eval_exact_match_for_cause_effect_classification": 49.9333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 24.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 35.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 3.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_textual_entailment": 12.6667, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 50.0887, + "eval_f1_for_answerability_classification": 57.0, + "eval_f1_for_cause_effect_classification": 53.5186, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.1866, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.9928, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.5649, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task396_persianqa_answerability_classification": 57.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 35.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.361, + "eval_f1_for_task534_farstail_textual_entailment": 3.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_textual_entailment": 21.787, + "eval_f1_for_title_generation": 25.1866, + "eval_gen_len": 4.4051, + "eval_global_step": 7500, + "eval_loss": 0.5247823596000671, + "eval_rouge1": 46.6911, + "eval_rouge1_for_answerability_classification": 57.0, + "eval_rouge1_for_cause_effect_classification": 50.9887, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 8.5273, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.7567, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.9049, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 35.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 3.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_textual_entailment": 13.0, + "eval_rouge1_for_title_generation": 8.5273, + "eval_rougeL": 46.6725, + "eval_rougeL_for_answerability_classification": 57.0, + "eval_rougeL_for_cause_effect_classification": 50.9754, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 8.2773, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.5567, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.7049, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 35.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 3.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_textual_entailment": 13.0, + "eval_rougeL_for_title_generation": 8.2773, + "eval_runtime": 53.4229, + "eval_samples_per_second": 65.515, + "eval_steps_per_second": 1.03, + "step": 7500 + }, + { + "epoch": 1.06, + "learning_rate": 5e-05, + "loss": 1.0752, + "step": 8000 + }, + { + "epoch": 1.06, + "eval_exact_match": 49.6286, + "eval_exact_match_for_answerability_classification": 64.0, + "eval_exact_match_for_cause_effect_classification": 53.0667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 59.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 57.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_textual_entailment": 26.3333, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 54.0585, + "eval_f1_for_answerability_classification": 64.0, + "eval_f1_for_cause_effect_classification": 56.6185, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 24.7119, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.9217, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.134, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 59.0, + "eval_f1_for_task396_persianqa_answerability_classification": 64.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.7787, + "eval_f1_for_task534_farstail_textual_entailment": 33.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 57.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_textual_entailment": 34.9262, + "eval_f1_for_title_generation": 24.7119, + "eval_gen_len": 4.2411, + "eval_global_step": 8000, + "eval_loss": 0.48732811212539673, + "eval_rouge1": 50.7222, + "eval_rouge1_for_answerability_classification": 64.0, + "eval_rouge1_for_cause_effect_classification": 54.1718, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.1237, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.4976, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.6573, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 59.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 57.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_textual_entailment": 26.3333, + "eval_rouge1_for_title_generation": 7.1237, + "eval_rougeL": 50.7222, + "eval_rougeL_for_answerability_classification": 64.0, + "eval_rougeL_for_cause_effect_classification": 54.1718, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 47.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 68.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.1237, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.4976, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.6573, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 59.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 57.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_textual_entailment": 26.3333, + "eval_rougeL_for_title_generation": 7.1237, + "eval_runtime": 51.5603, + "eval_samples_per_second": 67.882, + "eval_steps_per_second": 1.067, + "step": 8000 + }, + { + "epoch": 1.13, + "learning_rate": 5e-05, + "loss": 1.0244, + "step": 8500 + }, + { + "epoch": 1.13, + "eval_exact_match": 48.1143, + "eval_exact_match_for_answerability_classification": 62.0, + "eval_exact_match_for_cause_effect_classification": 52.2, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 40.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 23.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 23.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 48.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 48.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_textual_entailment": 18.6667, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 52.8712, + "eval_f1_for_answerability_classification": 62.0, + "eval_f1_for_cause_effect_classification": 56.0091, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 26.6965, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 60.2113, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.5611, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_f1_for_task396_persianqa_answerability_classification": 62.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 25.5214, + "eval_f1_for_task534_farstail_textual_entailment": 23.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 74.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_textual_entailment": 27.1738, + "eval_f1_for_title_generation": 26.6965, + "eval_gen_len": 4.112, + "eval_global_step": 8500, + "eval_loss": 0.5391484498977661, + "eval_rouge1": 49.5027, + "eval_rouge1_for_answerability_classification": 62.0, + "eval_rouge1_for_cause_effect_classification": 53.4298, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.2, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 59.8095, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.084, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 23.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 48.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 48.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_textual_entailment": 19.1667, + "eval_rouge1_for_title_generation": 10.2, + "eval_rougeL": 49.5027, + "eval_rougeL_for_answerability_classification": 62.0, + "eval_rougeL_for_cause_effect_classification": 53.4298, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 10.2, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 59.8095, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.084, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 23.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 48.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 48.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_textual_entailment": 19.1667, + "eval_rougeL_for_title_generation": 10.2, + "eval_runtime": 51.3401, + "eval_samples_per_second": 68.173, + "eval_steps_per_second": 1.071, + "step": 8500 + }, + { + "epoch": 1.2, + "learning_rate": 5e-05, + "loss": 1.0551, + "step": 9000 + }, + { + "epoch": 1.2, + "eval_exact_match": 48.1143, + "eval_exact_match_for_answerability_classification": 71.0, + "eval_exact_match_for_cause_effect_classification": 51.1667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 55.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 71.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 30.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 55.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 56.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_textual_entailment": 25.0, + "eval_exact_match_for_title_generation": 3.0, + "eval_f1": 52.7162, + "eval_f1_for_answerability_classification": 71.0, + "eval_f1_for_cause_effect_classification": 54.7681, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 27.3639, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.3176, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 55.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.7249, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_f1_for_task396_persianqa_answerability_classification": 71.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 28.659, + "eval_f1_for_task534_farstail_textual_entailment": 30.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 55.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 56.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_textual_entailment": 34.553, + "eval_f1_for_title_generation": 27.3639, + "eval_gen_len": 4.5371, + "eval_global_step": 9000, + "eval_loss": 0.5095714330673218, + "eval_rouge1": 49.3168, + "eval_rouge1_for_answerability_classification": 71.0, + "eval_rouge1_for_cause_effect_classification": 52.28, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.1889, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.954, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 55.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.4462, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 71.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 30.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 55.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 56.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_textual_entailment": 25.5, + "eval_rouge1_for_title_generation": 10.1889, + "eval_rougeL": 49.3111, + "eval_rougeL_for_answerability_classification": 71.0, + "eval_rougeL_for_cause_effect_classification": 52.2733, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 10.1889, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.954, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 55.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.2462, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 71.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 30.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 55.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 56.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_textual_entailment": 25.5, + "eval_rougeL_for_title_generation": 10.1889, + "eval_runtime": 55.8217, + "eval_samples_per_second": 62.7, + "eval_steps_per_second": 0.985, + "step": 9000 + }, + { + "epoch": 1.26, + "learning_rate": 5e-05, + "loss": 1.073, + "step": 9500 + }, + { + "epoch": 1.26, + "eval_exact_match": 49.2286, + "eval_exact_match_for_answerability_classification": 61.0, + "eval_exact_match_for_cause_effect_classification": 52.7667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 63.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 61.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 46.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 32.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 55.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_textual_entailment": 26.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 53.4079, + "eval_f1_for_answerability_classification": 61.0, + "eval_f1_for_cause_effect_classification": 56.0202, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 63.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.0851, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3659, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.7402, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_f1_for_task396_persianqa_answerability_classification": 61.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 46.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.5864, + "eval_f1_for_task534_farstail_textual_entailment": 32.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 77.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 79.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_textual_entailment": 34.8621, + "eval_f1_for_title_generation": 23.0851, + "eval_gen_len": 4.1429, + "eval_global_step": 9500, + "eval_loss": 0.5040011405944824, + "eval_rouge1": 50.2692, + "eval_rouge1_for_answerability_classification": 61.0, + "eval_rouge1_for_cause_effect_classification": 53.7452, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 63.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.5667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.0282, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.3278, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 61.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 32.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 55.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_textual_entailment": 26.5, + "eval_rouge1_for_title_generation": 6.5667, + "eval_rougeL": 50.2635, + "eval_rougeL_for_answerability_classification": 61.0, + "eval_rougeL_for_cause_effect_classification": 53.7385, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 63.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.5667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.0282, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.1278, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 61.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 32.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 55.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_textual_entailment": 26.5, + "eval_rougeL_for_title_generation": 6.5667, + "eval_runtime": 50.7287, + "eval_samples_per_second": 68.994, + "eval_steps_per_second": 1.084, + "step": 9500 + }, + { + "epoch": 1.33, + "learning_rate": 5e-05, + "loss": 1.0736, + "step": 10000 + }, + { + "epoch": 1.33, + "eval_exact_match": 49.7143, + "eval_exact_match_for_answerability_classification": 67.0, + "eval_exact_match_for_cause_effect_classification": 53.3, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 65.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 67.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 47.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 25.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 65.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_textual_entailment": 24.3333, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 54.0982, + "eval_f1_for_answerability_classification": 67.0, + "eval_f1_for_cause_effect_classification": 56.8652, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 65.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.1284, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.2905, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.1648, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task396_persianqa_answerability_classification": 67.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 47.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 25.3545, + "eval_f1_for_task534_farstail_textual_entailment": 25.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 65.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_textual_entailment": 32.4515, + "eval_f1_for_title_generation": 23.1284, + "eval_gen_len": 4.2194, + "eval_global_step": 10000, + "eval_loss": 0.5591691136360168, + "eval_rouge1": 50.9114, + "eval_rouge1_for_answerability_classification": 67.0, + "eval_rouge1_for_cause_effect_classification": 54.3911, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 65.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 9.1667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 63.9211, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.8107, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 67.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 47.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 25.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 65.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_textual_entailment": 24.6667, + "eval_rouge1_for_title_generation": 9.1667, + "eval_rougeL": 50.9114, + "eval_rougeL_for_answerability_classification": 67.0, + "eval_rougeL_for_cause_effect_classification": 54.3911, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 65.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.1667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 63.9211, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.8107, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 67.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 47.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 25.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 65.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_textual_entailment": 24.6667, + "eval_rougeL_for_title_generation": 9.1667, + "eval_runtime": 53.0747, + "eval_samples_per_second": 65.945, + "eval_steps_per_second": 1.036, + "step": 10000 + }, + { + "epoch": 1.39, + "learning_rate": 5e-05, + "loss": 1.0635, + "step": 10500 + }, + { + "epoch": 1.39, + "eval_exact_match": 49.4286, + "eval_exact_match_for_answerability_classification": 60.0, + "eval_exact_match_for_cause_effect_classification": 52.8, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 58.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 62.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 60.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 46.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 39.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 47.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_textual_entailment": 28.6667, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 53.8781, + "eval_f1_for_answerability_classification": 60.0, + "eval_f1_for_cause_effect_classification": 56.337, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.1671, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 74.3401, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 44.7686, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 62.0, + "eval_f1_for_task396_persianqa_answerability_classification": 60.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 46.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.4562, + "eval_f1_for_task534_farstail_textual_entailment": 39.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 47.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_textual_entailment": 37.4854, + "eval_f1_for_title_generation": 23.1671, + "eval_gen_len": 4.2829, + "eval_global_step": 10500, + "eval_loss": 0.5000580549240112, + "eval_rouge1": 50.5195, + "eval_rouge1_for_answerability_classification": 60.0, + "eval_rouge1_for_cause_effect_classification": 53.8171, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.6667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 74.2116, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 44.3028, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 62.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 60.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 39.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 47.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_textual_entailment": 28.6667, + "eval_rouge1_for_title_generation": 7.6667, + "eval_rougeL": 50.5195, + "eval_rougeL_for_answerability_classification": 60.0, + "eval_rougeL_for_cause_effect_classification": 53.8171, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.6667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 74.2116, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 44.3028, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 62.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 60.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 39.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 47.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_textual_entailment": 28.6667, + "eval_rougeL_for_title_generation": 7.6667, + "eval_runtime": 56.3252, + "eval_samples_per_second": 62.139, + "eval_steps_per_second": 0.976, + "step": 10500 + }, + { + "epoch": 1.46, + "learning_rate": 5e-05, + "loss": 1.0416, + "step": 11000 + }, + { + "epoch": 1.46, + "eval_exact_match": 49.9714, + "eval_exact_match_for_answerability_classification": 64.0, + "eval_exact_match_for_cause_effect_classification": 53.5333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 70.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 63.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 41.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 36.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 48.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_textual_entailment": 26.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 54.3691, + "eval_f1_for_answerability_classification": 64.0, + "eval_f1_for_cause_effect_classification": 57.1392, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 70.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 63.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 20.8497, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 72.8568, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.8202, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task396_persianqa_answerability_classification": 64.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 41.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.8933, + "eval_f1_for_task534_farstail_textual_entailment": 36.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 74.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_textual_entailment": 34.6311, + "eval_f1_for_title_generation": 20.8497, + "eval_gen_len": 4.2114, + "eval_global_step": 11000, + "eval_loss": 0.5632901787757874, + "eval_rouge1": 51.059, + "eval_rouge1_for_answerability_classification": 64.0, + "eval_rouge1_for_cause_effect_classification": 54.596, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 70.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 63.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.1857, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 72.6155, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.2633, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 41.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 36.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 48.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_textual_entailment": 26.0, + "eval_rouge1_for_title_generation": 7.1857, + "eval_rougeL": 51.0533, + "eval_rougeL_for_answerability_classification": 64.0, + "eval_rougeL_for_cause_effect_classification": 54.5893, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 70.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 63.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.1857, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 72.6155, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.0633, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 41.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 36.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 48.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_textual_entailment": 26.0, + "eval_rougeL_for_title_generation": 7.1857, + "eval_runtime": 50.6144, + "eval_samples_per_second": 69.15, + "eval_steps_per_second": 1.087, + "step": 11000 + }, + { + "epoch": 1.53, + "learning_rate": 5e-05, + "loss": 1.0416, + "step": 11500 + }, + { + "epoch": 1.53, + "eval_exact_match": 47.5714, + "eval_exact_match_for_answerability_classification": 76.0, + "eval_exact_match_for_cause_effect_classification": 51.2333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 21.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 76.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 37.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 14.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 56.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_textual_entailment": 17.3333, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 52.1909, + "eval_f1_for_answerability_classification": 76.0, + "eval_f1_for_cause_effect_classification": 54.9215, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.6704, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3374, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.3061, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_f1_for_task396_persianqa_answerability_classification": 76.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 37.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 28.3691, + "eval_f1_for_task534_farstail_textual_entailment": 14.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 56.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_textual_entailment": 26.4564, + "eval_f1_for_title_generation": 23.6704, + "eval_gen_len": 4.6251, + "eval_global_step": 11500, + "eval_loss": 0.49266964197158813, + "eval_rouge1": 48.7653, + "eval_rouge1_for_answerability_classification": 76.0, + "eval_rouge1_for_cause_effect_classification": 52.3959, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.4111, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.1104, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 39.7656, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 76.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 37.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 14.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 56.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_textual_entailment": 17.5, + "eval_rouge1_for_title_generation": 6.4111, + "eval_rougeL": 48.7609, + "eval_rougeL_for_answerability_classification": 76.0, + "eval_rougeL_for_cause_effect_classification": 52.3907, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.4111, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 66.9565, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 39.7656, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 76.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 37.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 14.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 56.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_textual_entailment": 17.5, + "eval_rougeL_for_title_generation": 6.4111, + "eval_runtime": 55.2074, + "eval_samples_per_second": 63.397, + "eval_steps_per_second": 0.996, + "step": 11500 + }, + { + "epoch": 1.59, + "learning_rate": 5e-05, + "loss": 1.0514, + "step": 12000 + }, + { + "epoch": 1.59, + "eval_exact_match": 49.5714, + "eval_exact_match_for_answerability_classification": 74.0, + "eval_exact_match_for_cause_effect_classification": 52.5667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 64.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 55.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 31.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 74.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 41.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 60.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_textual_entailment": 28.0, + "eval_exact_match_for_title_generation": 0.0, + "eval_f1": 53.9068, + "eval_f1_for_answerability_classification": 74.0, + "eval_f1_for_cause_effect_classification": 56.0614, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 64.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.0096, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.7858, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.0563, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task396_persianqa_answerability_classification": 74.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 25.8876, + "eval_f1_for_task534_farstail_textual_entailment": 41.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 60.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_textual_entailment": 36.2959, + "eval_f1_for_title_generation": 22.0096, + "eval_gen_len": 4.0271, + "eval_global_step": 12000, + "eval_loss": 0.47120869159698486, + "eval_rouge1": 50.6592, + "eval_rouge1_for_answerability_classification": 74.0, + "eval_rouge1_for_cause_effect_classification": 53.5865, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 64.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.9778, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.6986, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 45.8955, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 74.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 41.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 60.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_textual_entailment": 28.1667, + "eval_rouge1_for_title_generation": 6.9778, + "eval_rougeL": 50.6535, + "eval_rougeL_for_answerability_classification": 74.0, + "eval_rougeL_for_cause_effect_classification": 53.5798, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 64.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.9778, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.6986, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.6955, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 74.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 41.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 60.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_textual_entailment": 28.1667, + "eval_rougeL_for_title_generation": 6.9778, + "eval_runtime": 49.3521, + "eval_samples_per_second": 70.919, + "eval_steps_per_second": 1.114, + "step": 12000 + }, + { + "epoch": 1.66, + "learning_rate": 5e-05, + "loss": 1.0451, + "step": 12500 + }, + { + "epoch": 1.66, + "eval_exact_match": 47.8, + "eval_exact_match_for_answerability_classification": 64.0, + "eval_exact_match_for_cause_effect_classification": 51.0333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 31.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_textual_entailment": 25.3333, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 52.3423, + "eval_f1_for_answerability_classification": 64.0, + "eval_f1_for_cause_effect_classification": 54.7372, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.1545, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.4465, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.6682, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task396_persianqa_answerability_classification": 64.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.7129, + "eval_f1_for_task534_farstail_textual_entailment": 34.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_textual_entailment": 34.571, + "eval_f1_for_title_generation": 22.1545, + "eval_gen_len": 4.6566, + "eval_global_step": 12500, + "eval_loss": 0.5286997556686401, + "eval_rouge1": 48.9372, + "eval_rouge1_for_answerability_classification": 64.0, + "eval_rouge1_for_cause_effect_classification": 52.2161, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.319, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.285, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 46.1972, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_textual_entailment": 25.6667, + "eval_rouge1_for_title_generation": 5.319, + "eval_rougeL": 48.9214, + "eval_rougeL_for_answerability_classification": 64.0, + "eval_rougeL_for_cause_effect_classification": 52.1976, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.319, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.9312, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.9972, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_textual_entailment": 25.6667, + "eval_rougeL_for_title_generation": 5.319, + "eval_runtime": 57.801, + "eval_samples_per_second": 60.553, + "eval_steps_per_second": 0.952, + "step": 12500 + }, + { + "epoch": 1.73, + "learning_rate": 5e-05, + "loss": 1.0371, + "step": 13000 + }, + { + "epoch": 1.73, + "eval_exact_match": 48.1143, + "eval_exact_match_for_answerability_classification": 62.0, + "eval_exact_match_for_cause_effect_classification": 52.1333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 34.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 10.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 59.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_textual_entailment": 18.6667, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 52.5387, + "eval_f1_for_answerability_classification": 62.0, + "eval_f1_for_cause_effect_classification": 55.6905, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.0795, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.517, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 48.1994, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_f1_for_task396_persianqa_answerability_classification": 62.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 29.057, + "eval_f1_for_task534_farstail_textual_entailment": 10.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 59.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_textual_entailment": 28.019, + "eval_f1_for_title_generation": 22.0795, + "eval_gen_len": 4.4326, + "eval_global_step": 13000, + "eval_loss": 0.5131350159645081, + "eval_rouge1": 49.2131, + "eval_rouge1_for_answerability_classification": 62.0, + "eval_rouge1_for_cause_effect_classification": 53.1587, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 9.697, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.1421, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 47.6192, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 10.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 59.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_textual_entailment": 18.6667, + "eval_rouge1_for_title_generation": 9.697, + "eval_rougeL": 49.2002, + "eval_rougeL_for_answerability_classification": 62.0, + "eval_rougeL_for_cause_effect_classification": 53.152, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.447, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.1421, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 47.4192, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 10.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 59.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_textual_entailment": 18.6667, + "eval_rougeL_for_title_generation": 9.447, + "eval_runtime": 52.3408, + "eval_samples_per_second": 66.869, + "eval_steps_per_second": 1.051, + "step": 13000 + }, + { + "epoch": 1.79, + "learning_rate": 5e-05, + "loss": 1.0494, + "step": 13500 + }, + { + "epoch": 1.79, + "eval_exact_match": 48.2857, + "eval_exact_match_for_answerability_classification": 58.0, + "eval_exact_match_for_cause_effect_classification": 51.9, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 58.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 30.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_textual_entailment": 24.3333, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 52.5952, + "eval_f1_for_answerability_classification": 58.0, + "eval_f1_for_cause_effect_classification": 55.3688, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.267, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 66.5262, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.5375, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_f1_for_task396_persianqa_answerability_classification": 58.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 27.5012, + "eval_f1_for_task534_farstail_textual_entailment": 30.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 58.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_textual_entailment": 33.1671, + "eval_f1_for_title_generation": 22.267, + "eval_gen_len": 4.0611, + "eval_global_step": 13500, + "eval_loss": 0.5875681042671204, + "eval_rouge1": 49.2211, + "eval_rouge1_for_answerability_classification": 58.0, + "eval_rouge1_for_cause_effect_classification": 52.8555, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.5744, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 66.5884, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.0767, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 58.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 30.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_textual_entailment": 24.5, + "eval_rouge1_for_title_generation": 5.5744, + "eval_rougeL": 49.2154, + "eval_rougeL_for_answerability_classification": 58.0, + "eval_rougeL_for_cause_effect_classification": 52.8488, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.5744, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 66.5884, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.8767, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 58.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 30.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_textual_entailment": 24.5, + "eval_rougeL_for_title_generation": 5.5744, + "eval_runtime": 48.6475, + "eval_samples_per_second": 71.946, + "eval_steps_per_second": 1.131, + "step": 13500 + }, + { + "epoch": 1.86, + "learning_rate": 5e-05, + "loss": 1.0335, + "step": 14000 + }, + { + "epoch": 1.86, + "eval_exact_match": 49.2286, + "eval_exact_match_for_answerability_classification": 62.0, + "eval_exact_match_for_cause_effect_classification": 53.3333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 59.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 62.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 17.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 42.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_exact_match_for_textual_entailment": 20.0, + "eval_exact_match_for_title_generation": 1.0, + "eval_f1": 53.4981, + "eval_f1_for_answerability_classification": 62.0, + "eval_f1_for_cause_effect_classification": 56.6994, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 59.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 62.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.2075, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.3948, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.587, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_f1_for_task396_persianqa_answerability_classification": 62.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 17.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 28.2439, + "eval_f1_for_task534_farstail_textual_entailment": 42.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 77.0, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 54.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 77.0, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_f1_for_textual_entailment": 29.0813, + "eval_f1_for_title_generation": 22.2075, + "eval_gen_len": 4.2831, + "eval_global_step": 14000, + "eval_loss": 0.5322003364562988, + "eval_rouge1": 50.8699, + "eval_rouge1_for_answerability_classification": 62.0, + "eval_rouge1_for_cause_effect_classification": 54.3127, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 59.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 62.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.5667, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.2851, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.0959, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 40.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 42.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rouge1_for_textual_entailment": 27.8333, + "eval_rouge1_for_title_generation": 5.5667, + "eval_rougeL": 50.8699, + "eval_rougeL_for_answerability_classification": 62.0, + "eval_rougeL_for_cause_effect_classification": 54.3127, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 59.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 62.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.5667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.2851, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.0959, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 60.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 40.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 42.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 54.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, + "eval_rougeL_for_textual_entailment": 27.8333, + "eval_rougeL_for_title_generation": 5.5667, + "eval_runtime": 55.1998, + "eval_samples_per_second": 63.406, + "eval_steps_per_second": 0.996, + "step": 14000 + }, + { + "epoch": 1.93, + "learning_rate": 5e-05, + "loss": 1.0581, + "step": 14500 + }, + { + "epoch": 1.93, + "eval_exact_match": 49.6857, + "eval_exact_match_for_answerability_classification": 60.0, + "eval_exact_match_for_cause_effect_classification": 53.9333, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 67.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 64.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 48.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 33.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 60.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 14.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 44.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 57.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 61.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 66.0, + "eval_exact_match_for_textual_entailment": 19.6667, + "eval_exact_match_for_title_generation": 2.0, + "eval_f1": 53.6169, + "eval_f1_for_answerability_classification": 60.0, + "eval_f1_for_cause_effect_classification": 57.036, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 67.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 64.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.3724, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 63.5684, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.0115, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_f1_for_task396_persianqa_answerability_classification": 60.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 14.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.1387, + "eval_f1_for_task534_farstail_textual_entailment": 44.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 78.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 80.5, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 76.5, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 66.0, + "eval_f1_for_textual_entailment": 28.0462, + "eval_f1_for_title_generation": 21.3724, + "eval_gen_len": 4.0269, + "eval_global_step": 14500, + "eval_loss": 0.5212923884391785, + "eval_rouge1": 51.347, + "eval_rouge1_for_answerability_classification": 60.0, + "eval_rouge1_for_cause_effect_classification": 54.8696, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 67.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 64.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.0571, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 63.5303, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 45.5583, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 60.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 40.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rouge1_for_task534_farstail_textual_entailment": 44.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 57.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 61.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 66.0, + "eval_rouge1_for_textual_entailment": 28.3333, + "eval_rouge1_for_title_generation": 6.0571, + "eval_rougeL": 51.347, + "eval_rougeL_for_answerability_classification": 60.0, + "eval_rougeL_for_cause_effect_classification": 54.8696, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 67.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 64.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.0571, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 63.5303, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 58.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.5583, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 60.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 40.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, + "eval_rougeL_for_task534_farstail_textual_entailment": 44.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 57.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 61.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 66.0, + "eval_rougeL_for_textual_entailment": 28.3333, + "eval_rougeL_for_title_generation": 6.0571, + "eval_runtime": 50.3438, + "eval_samples_per_second": 69.522, + "eval_steps_per_second": 1.092, + "step": 14500 + }, + { + "epoch": 1.99, + "learning_rate": 5e-05, + "loss": 1.0392, + "step": 15000 + }, + { + "epoch": 1.99, + "eval_exact_match": 47.5429, + "eval_exact_match_for_answerability_classification": 57.0, + "eval_exact_match_for_cause_effect_classification": 52.2667, + "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, + "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, + "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 57.0, + "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, + "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 58.0, + "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, + "eval_exact_match_for_task463_pasinlu_textual_entailment": 19.0, + "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, + "eval_exact_match_for_task534_farstail_textual_entailment": 16.0, + "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 55.0, + "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_exact_match_for_textual_entailment": 12.0, + "eval_exact_match_for_title_generation": 3.0, + "eval_f1": 51.8895, + "eval_f1_for_answerability_classification": 57.0, + "eval_f1_for_cause_effect_classification": 55.7605, + "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_f1_for_task1561_clickbait_news_bg_title_generation": 24.7349, + "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.2892, + "eval_f1_for_task1627_copa_hr_cause_effect_classification": 57.0, + "eval_f1_for_task1628_copa_hr_cause_effect_classification": 44.5254, + "eval_f1_for_task1629_copa_hr_cause_effect_classification": 58.0, + "eval_f1_for_task396_persianqa_answerability_classification": 57.0, + "eval_f1_for_task463_pasinlu_textual_entailment": 19.0, + "eval_f1_for_task464_pasinlu_textual_entailment": 26.5846, + "eval_f1_for_task534_farstail_textual_entailment": 16.0, + "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.5, + "eval_f1_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_f1_for_task940_indicnlp_cause_effect_classification": 76.0, + "eval_f1_for_task941_indicnlp_cause_effect_classification": 55.0, + "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, + "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_f1_for_textual_entailment": 20.5282, + "eval_f1_for_title_generation": 24.7349, + "eval_gen_len": 4.1929, + "eval_global_step": 15000, + "eval_loss": 0.5555234551429749, + "eval_rouge1": 49.3924, + "eval_rouge1_for_answerability_classification": 57.0, + "eval_rouge1_for_cause_effect_classification": 53.3372, + "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 8.1167, + "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.1305, + "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 57.0, + "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.9862, + "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 58.0, + "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, + "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rouge1_for_task534_farstail_textual_entailment": 16.0, + "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 55.0, + "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rouge1_for_textual_entailment": 21.1667, + "eval_rouge1_for_title_generation": 8.1167, + "eval_rougeL": 49.3795, + "eval_rougeL_for_answerability_classification": 57.0, + "eval_rougeL_for_cause_effect_classification": 53.3306, + "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, + "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 57.0, + "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, + "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, + "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, + "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, + "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, + "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.8667, + "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.1305, + "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 57.0, + "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 43.7862, + "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 58.0, + "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, + "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, + "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, + "eval_rougeL_for_task534_farstail_textual_entailment": 16.0, + "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 53.0, + "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 62.0, + "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 52.0, + "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 55.0, + "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, + "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, + "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, + "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, + "eval_rougeL_for_textual_entailment": 21.1667, + "eval_rougeL_for_title_generation": 7.8667, + "eval_runtime": 48.2804, + "eval_samples_per_second": 72.493, + "eval_steps_per_second": 1.139, + "step": 15000 + }, + { + "epoch": 2.0, + "step": 15062, + "total_flos": 1.5362031529597338e+18, + "train_loss": 1.2364440905811966, + "train_runtime": 83936.7952, + "train_samples_per_second": 2.871, + "train_steps_per_second": 0.179 + } + ], + "max_steps": 15062, + "num_train_epochs": 2, + "total_flos": 1.5362031529597338e+18, + "trial_name": null, + "trial_params": null +}