{ "best_metric": 50.9114, "best_model_checkpoint": "/output/checkpoint-10000", "epoch": 2.0, "global_step": 15062, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.0, "loss": 11.2617, "step": 1 }, { "epoch": 0.0, "eval_exact_match": 0.0, "eval_exact_match_for_answerability_classification": 0.0, "eval_exact_match_for_cause_effect_classification": 0.0, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 0.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 0.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 0.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 0.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 0.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 0.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 0.0, "eval_exact_match_for_textual_entailment": 0.0, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 4.2644, "eval_f1_for_answerability_classification": 1.8668, "eval_f1_for_cause_effect_classification": 4.344, "eval_f1_for_task1168_xcopa_cause_effect_classification": 3.471, "eval_f1_for_task1169_xcopa_cause_effect_classification": 3.1606, "eval_f1_for_task1170_xcopa_cause_effect_classification": 3.6846, "eval_f1_for_task1171_xcopa_cause_effect_classification": 3.2959, "eval_f1_for_task1172_xcopa_cause_effect_classification": 2.4751, "eval_f1_for_task1173_xcopa_cause_effect_classification": 3.3739, "eval_f1_for_task1174_xcopa_cause_effect_classification": 2.7326, "eval_f1_for_task1175_xcopa_cause_effect_classification": 3.4745, "eval_f1_for_task1176_xcopa_cause_effect_classification": 3.1997, "eval_f1_for_task1177_xcopa_cause_effect_classification": 3.2799, "eval_f1_for_task1178_xcopa_cause_effect_classification": 5.1837, "eval_f1_for_task1179_xcopa_cause_effect_classification": 4.1242, "eval_f1_for_task1180_xcopa_cause_effect_classification": 3.8632, "eval_f1_for_task1181_xcopa_cause_effect_classification": 4.7895, "eval_f1_for_task1182_xcopa_cause_effect_classification": 3.4823, "eval_f1_for_task1183_xcopa_cause_effect_classification": 3.3336, "eval_f1_for_task1184_xcopa_cause_effect_classification": 2.0693, "eval_f1_for_task1185_xcopa_cause_effect_classification": 5.1318, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 4.1919, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 13.1647, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 2.3551, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 4.0293, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 2.7788, "eval_f1_for_task396_persianqa_answerability_classification": 1.8668, "eval_f1_for_task463_pasinlu_textual_entailment": 2.4353, "eval_f1_for_task464_pasinlu_textual_entailment": 8.3545, "eval_f1_for_task534_farstail_textual_entailment": 2.0874, "eval_f1_for_task938_indicnlp_cause_effect_classification": 6.9245, "eval_f1_for_task939_indicnlp_cause_effect_classification": 4.611, "eval_f1_for_task940_indicnlp_cause_effect_classification": 7.979, "eval_f1_for_task941_indicnlp_cause_effect_classification": 5.4811, "eval_f1_for_task942_indicnlp_cause_effect_classification": 6.9087, "eval_f1_for_task943_indicnlp_cause_effect_classification": 3.1593, "eval_f1_for_task968_xcopa_cause_effect_classification": 4.2922, "eval_f1_for_task969_xcopa_cause_effect_classification": 4.51, "eval_f1_for_textual_entailment": 4.2924, "eval_f1_for_title_generation": 4.1919, "eval_gen_len": 111.9417, "eval_global_step": 1, "eval_loss": 14.192606925964355, "eval_rouge1": 3.1222, "eval_rouge1_for_answerability_classification": 2.0936, "eval_rouge1_for_cause_effect_classification": 3.418, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 2.9198, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 2.1195, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 4.1343, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 2.2827, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 3.0535, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 2.5602, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 2.6335, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 2.631, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 3.7264, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 2.7074, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 4.5135, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 2.6166, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 3.5439, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 3.159, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 2.7565, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 2.2842, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 3.4868, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 3.3792, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 0.36, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 10.5917, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 1.8427, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 3.6141, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 2.0352, "eval_rouge1_for_task396_persianqa_answerability_classification": 2.0936, "eval_rouge1_for_task463_pasinlu_textual_entailment": 2.3758, "eval_rouge1_for_task464_pasinlu_textual_entailment": 0.0491, "eval_rouge1_for_task534_farstail_textual_entailment": 1.8557, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 3.5991, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 3.9341, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 4.1945, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 4.8076, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 4.1962, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 2.1487, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 4.0485, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 3.0208, "eval_rouge1_for_textual_entailment": 1.4269, "eval_rouge1_for_title_generation": 0.36, "eval_rougeL": 3.1178, "eval_rougeL_for_answerability_classification": 2.0936, "eval_rougeL_for_cause_effect_classification": 3.413, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 2.9198, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 2.1195, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 4.1343, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 2.2827, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 3.0535, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 2.5602, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 2.6335, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 2.631, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 3.7264, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 2.7074, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 4.5135, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 2.6166, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 3.5439, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 3.159, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 2.7565, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 2.2842, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 3.4868, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 3.3792, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 0.36, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 10.474, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 1.8427, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 3.5796, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 2.0352, "eval_rougeL_for_task396_persianqa_answerability_classification": 2.0936, "eval_rougeL_for_task463_pasinlu_textual_entailment": 2.3758, "eval_rougeL_for_task464_pasinlu_textual_entailment": 0.0491, "eval_rougeL_for_task534_farstail_textual_entailment": 1.8557, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 3.5991, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 3.9341, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 4.1945, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 4.8076, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 4.1962, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 2.1487, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 4.0485, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 3.0208, "eval_rougeL_for_textual_entailment": 1.4269, "eval_rougeL_for_title_generation": 0.36, "eval_runtime": 410.3185, "eval_samples_per_second": 8.53, "eval_steps_per_second": 0.134, "step": 1 }, { "epoch": 0.01, "learning_rate": 5e-05, "loss": 4.395, "step": 50 }, { "epoch": 0.01, "eval_exact_match": 41.4857, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 44.5, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 20.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 5.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 0.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_textual_entailment": 22.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 44.8407, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 47.9961, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 8.2131, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 28.7008, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 15.5144, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, "eval_f1_for_task464_pasinlu_textual_entailment": 5.3294, "eval_f1_for_task534_farstail_textual_entailment": 33.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 27.3333, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 33.3333, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_f1_for_textual_entailment": 23.7765, "eval_f1_for_title_generation": 8.2131, "eval_gen_len": 2.8286, "eval_global_step": 50, "eval_loss": 0.9278950691223145, "eval_rouge1": 44.6676, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 48.1566, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 1.6667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 28.4918, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 15.2061, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 41.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_textual_entailment": 22.3333, "eval_rouge1_for_title_generation": 1.6667, "eval_rougeL": 44.6676, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 48.1566, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 1.6667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 28.4918, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 15.2061, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 41.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_textual_entailment": 22.3333, "eval_rougeL_for_title_generation": 1.6667, "eval_runtime": 52.7494, "eval_samples_per_second": 66.351, "eval_steps_per_second": 1.043, "step": 50 }, { "epoch": 0.01, "learning_rate": 5e-05, "loss": 2.0981, "step": 100 }, { "epoch": 0.01, "eval_exact_match": 46.2571, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 50.1, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 32.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 32.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 21.3333, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 50.3202, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 53.9093, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 11.4378, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.7794, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.9984, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 32.0, "eval_f1_for_task464_pasinlu_textual_entailment": 18.4906, "eval_f1_for_task534_farstail_textual_entailment": 32.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 27.4969, "eval_f1_for_title_generation": 11.4378, "eval_gen_len": 3.4271, "eval_global_step": 100, "eval_loss": 0.5112689733505249, "eval_rouge1": 47.4081, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 51.3773, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 2.9667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.0879, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.2301, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 32.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 32.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 21.6667, "eval_rouge1_for_title_generation": 2.9667, "eval_rougeL": 47.4034, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 51.3717, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 2.9667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.0879, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.0634, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 32.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 32.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 21.6667, "eval_rougeL_for_title_generation": 2.9667, "eval_runtime": 49.8187, "eval_samples_per_second": 70.255, "eval_steps_per_second": 1.104, "step": 100 }, { "epoch": 0.03, "learning_rate": 5e-05, "loss": 1.903, "step": 200 }, { "epoch": 0.03, "eval_exact_match": 45.3714, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 49.0333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 18.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 31.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 21.6667, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 49.5606, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 52.8281, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 9.8754, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 71.8608, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 37.9808, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, "eval_f1_for_task464_pasinlu_textual_entailment": 24.903, "eval_f1_for_task534_farstail_textual_entailment": 31.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 29.9677, "eval_f1_for_title_generation": 9.8754, "eval_gen_len": 3.4326, "eval_global_step": 200, "eval_loss": 0.4994029104709625, "eval_rouge1": 46.5531, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 50.3136, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 3.45, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 71.5543, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.8534, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 31.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 22.1667, "eval_rouge1_for_title_generation": 3.45, "eval_rougeL": 46.5374, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 50.3036, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 3.2, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 71.5543, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.5534, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 31.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 22.1667, "eval_rougeL_for_title_generation": 3.2, "eval_runtime": 47.216, "eval_samples_per_second": 74.127, "eval_steps_per_second": 1.165, "step": 200 }, { "epoch": 0.07, "learning_rate": 5e-05, "loss": 1.7406, "step": 500 }, { "epoch": 0.07, "eval_exact_match": 45.6286, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 49.2667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 58.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 22.6667, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 49.876, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 52.8919, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 16.1737, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 73.2462, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.5102, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, "eval_f1_for_task464_pasinlu_textual_entailment": 25.7294, "eval_f1_for_task534_farstail_textual_entailment": 34.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 30.9098, "eval_f1_for_title_generation": 16.1737, "eval_gen_len": 4.2251, "eval_global_step": 500, "eval_loss": 0.4882946312427521, "eval_rouge1": 46.7309, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 50.3514, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.3726, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 72.734, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.8093, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.6667, "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 22.8889, "eval_rouge1_for_title_generation": 6.3726, "eval_rougeL": 46.7252, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 50.3448, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.3726, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 72.734, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.6093, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.6667, "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 22.8889, "eval_rougeL_for_title_generation": 6.3726, "eval_runtime": 51.2553, "eval_samples_per_second": 68.286, "eval_steps_per_second": 1.073, "step": 500 }, { "epoch": 0.13, "learning_rate": 5e-05, "loss": 1.5969, "step": 1000 }, { "epoch": 0.13, "eval_exact_match": 44.4286, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 47.9333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 45.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 41.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 46.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 47.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 45.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 17.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 44.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 22.3333, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 48.7078, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 51.5153, "eval_f1_for_task1168_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 45.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 41.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 46.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 47.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 16.7735, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 61.5139, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 32.9466, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, "eval_f1_for_task464_pasinlu_textual_entailment": 25.54, "eval_f1_for_task534_farstail_textual_entailment": 34.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 44.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 30.8467, "eval_f1_for_title_generation": 16.7735, "eval_gen_len": 4.3826, "eval_global_step": 1000, "eval_loss": 0.47427454590797424, "eval_rouge1": 45.5347, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 48.9838, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 45.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 41.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 46.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 47.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.7, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 61.3384, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 32.1749, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 44.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 22.8333, "eval_rouge1_for_title_generation": 5.7, "eval_rougeL": 45.5246, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 48.972, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 45.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 41.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 46.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 47.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.7, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 61.1846, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 31.9749, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 44.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 22.8333, "eval_rougeL_for_title_generation": 5.7, "eval_runtime": 60.9063, "eval_samples_per_second": 57.465, "eval_steps_per_second": 0.903, "step": 1000 }, { "epoch": 0.2, "learning_rate": 5e-05, "loss": 1.4937, "step": 1500 }, { "epoch": 0.2, "eval_exact_match": 45.6571, "eval_exact_match_for_answerability_classification": 49.0, "eval_exact_match_for_cause_effect_classification": 49.3667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 44.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 42.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 40.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 46.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 33.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 48.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 49.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 22.3333, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 49.9636, "eval_f1_for_answerability_classification": 49.0, "eval_f1_for_cause_effect_classification": 52.7891, "eval_f1_for_task1168_xcopa_cause_effect_classification": 44.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 42.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 40.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 46.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.431, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.8772, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 47.7961, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 48.0, "eval_f1_for_task396_persianqa_answerability_classification": 49.0, "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.6215, "eval_f1_for_task534_farstail_textual_entailment": 33.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 77.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 31.2072, "eval_f1_for_title_generation": 22.431, "eval_gen_len": 4.6006, "eval_global_step": 1500, "eval_loss": 0.4453420639038086, "eval_rouge1": 46.7181, "eval_rouge1_for_answerability_classification": 49.0, "eval_rouge1_for_cause_effect_classification": 50.3361, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 44.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 42.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 40.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 46.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.5492, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.6298, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 47.4533, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 48.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 49.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 22.8333, "eval_rouge1_for_title_generation": 7.5492, "eval_rougeL": 46.7052, "eval_rougeL_for_answerability_classification": 49.0, "eval_rougeL_for_cause_effect_classification": 50.3294, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 44.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 42.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 40.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 46.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.2992, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.6298, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 47.2533, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 48.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 49.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 22.8333, "eval_rougeL_for_title_generation": 7.2992, "eval_runtime": 54.9496, "eval_samples_per_second": 63.695, "eval_steps_per_second": 1.001, "step": 1500 }, { "epoch": 0.27, "learning_rate": 5e-05, "loss": 1.4808, "step": 2000 }, { "epoch": 0.27, "eval_exact_match": 46.4857, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 50.2333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 46.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 43.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 44.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 35.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_textual_entailment": 23.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 50.859, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 53.7262, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 46.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 43.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 44.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.6628, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.642, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 36.1429, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 35.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.6186, "eval_f1_for_task534_farstail_textual_entailment": 33.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 61.0, "eval_f1_for_textual_entailment": 31.8729, "eval_f1_for_title_generation": 22.6628, "eval_gen_len": 4.3834, "eval_global_step": 2000, "eval_loss": 0.4502388536930084, "eval_rouge1": 47.5331, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 51.2125, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 46.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 43.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 44.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.7827, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.4834, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.8921, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 35.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_textual_entailment": 23.1667, "eval_rouge1_for_title_generation": 7.7827, "eval_rougeL": 47.5274, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 51.2059, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 46.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 43.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 44.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.7827, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.4834, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.6921, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 35.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_textual_entailment": 23.1667, "eval_rougeL_for_title_generation": 7.7827, "eval_runtime": 56.4908, "eval_samples_per_second": 61.957, "eval_steps_per_second": 0.974, "step": 2000 }, { "epoch": 0.33, "learning_rate": 5e-05, "loss": 1.4142, "step": 2500 }, { "epoch": 0.33, "eval_exact_match": 45.9143, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 49.5667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_textual_entailment": 22.6667, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 49.9839, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 53.1953, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 11.6421, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.4947, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 37.3657, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, "eval_f1_for_task464_pasinlu_textual_entailment": 24.9355, "eval_f1_for_task534_farstail_textual_entailment": 34.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_f1_for_textual_entailment": 30.6452, "eval_f1_for_title_generation": 11.6421, "eval_gen_len": 3.8066, "eval_global_step": 2500, "eval_loss": 0.4557723104953766, "eval_rouge1": 46.8499, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 50.6725, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 1.5714, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.4087, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 36.7677, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_textual_entailment": 22.6667, "eval_rouge1_for_title_generation": 1.5714, "eval_rougeL": 46.8385, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 50.6592, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 1.5714, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.2087, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 36.5677, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_textual_entailment": 22.6667, "eval_rougeL_for_title_generation": 1.5714, "eval_runtime": 52.9945, "eval_samples_per_second": 66.045, "eval_steps_per_second": 1.038, "step": 2500 }, { "epoch": 0.4, "learning_rate": 5e-05, "loss": 1.424, "step": 3000 }, { "epoch": 0.4, "eval_exact_match": 45.2571, "eval_exact_match_for_answerability_classification": 48.0, "eval_exact_match_for_cause_effect_classification": 49.8, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 47.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 45.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 48.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 6.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 48.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_textual_entailment": 13.6667, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 49.544, "eval_f1_for_answerability_classification": 48.0, "eval_f1_for_cause_effect_classification": 53.3133, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 47.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 45.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 20.0148, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3859, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.012, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 51.0, "eval_f1_for_task396_persianqa_answerability_classification": 48.0, "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.628, "eval_f1_for_task534_farstail_textual_entailment": 6.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 48.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_f1_for_textual_entailment": 22.2093, "eval_f1_for_title_generation": 20.0148, "eval_gen_len": 4.2606, "eval_global_step": 3000, "eval_loss": 0.49717187881469727, "eval_rouge1": 46.25, "eval_rouge1_for_answerability_classification": 48.0, "eval_rouge1_for_cause_effect_classification": 50.7961, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 47.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 45.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.8667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.3101, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.5737, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 51.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 48.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 6.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 48.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_textual_entailment": 13.6667, "eval_rouge1_for_title_generation": 5.8667, "eval_rougeL": 46.25, "eval_rougeL_for_answerability_classification": 48.0, "eval_rougeL_for_cause_effect_classification": 50.7961, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 47.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 45.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.8667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.3101, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.5737, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 51.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 48.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 6.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 48.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_textual_entailment": 13.6667, "eval_rougeL_for_title_generation": 5.8667, "eval_runtime": 51.2339, "eval_samples_per_second": 68.314, "eval_steps_per_second": 1.074, "step": 3000 }, { "epoch": 0.46, "learning_rate": 5e-05, "loss": 1.3657, "step": 3500 }, { "epoch": 0.46, "eval_exact_match": 46.0, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 49.4333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 49.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 39.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 47.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 25.0, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 50.4343, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 53.0825, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.5353, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.5879, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.8877, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 39.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.1911, "eval_f1_for_task534_farstail_textual_entailment": 35.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 73.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 33.397, "eval_f1_for_title_generation": 22.5353, "eval_gen_len": 4.2649, "eval_global_step": 3500, "eval_loss": 0.4972946345806122, "eval_rouge1": 47.073, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 50.493, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.7667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.3856, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.4042, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 39.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 47.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 25.0, "eval_rouge1_for_title_generation": 7.7667, "eval_rougeL": 47.0673, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 50.4863, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.7667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.3856, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.2042, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 39.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 47.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 25.0, "eval_rougeL_for_title_generation": 7.7667, "eval_runtime": 50.353, "eval_samples_per_second": 69.509, "eval_steps_per_second": 1.092, "step": 3500 }, { "epoch": 0.53, "learning_rate": 5e-05, "loss": 1.3591, "step": 4000 }, { "epoch": 0.53, "eval_exact_match": 45.0, "eval_exact_match_for_answerability_classification": 53.0, "eval_exact_match_for_cause_effect_classification": 49.5333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 53.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 0.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_textual_entailment": 11.6667, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 49.2805, "eval_f1_for_answerability_classification": 53.0, "eval_f1_for_cause_effect_classification": 53.0349, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 19.2178, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.9583, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 43.5893, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task396_persianqa_answerability_classification": 53.0, "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.551, "eval_f1_for_task534_farstail_textual_entailment": 0.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 77.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_f1_for_textual_entailment": 20.517, "eval_f1_for_title_generation": 19.2178, "eval_gen_len": 4.3746, "eval_global_step": 4000, "eval_loss": 0.5541166067123413, "eval_rouge1": 46.1285, "eval_rouge1_for_answerability_classification": 53.0, "eval_rouge1_for_cause_effect_classification": 50.6331, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.5048, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.8166, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.1766, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 53.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 0.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_textual_entailment": 11.6667, "eval_rouge1_for_title_generation": 7.5048, "eval_rougeL": 46.1228, "eval_rougeL_for_answerability_classification": 53.0, "eval_rougeL_for_cause_effect_classification": 50.6264, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.5048, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.8166, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.9766, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 53.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 0.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_textual_entailment": 11.6667, "eval_rougeL_for_title_generation": 7.5048, "eval_runtime": 56.9164, "eval_samples_per_second": 61.494, "eval_steps_per_second": 0.966, "step": 4000 }, { "epoch": 0.6, "learning_rate": 5e-05, "loss": 1.334, "step": 4500 }, { "epoch": 0.6, "eval_exact_match": 48.1429, "eval_exact_match_for_answerability_classification": 68.0, "eval_exact_match_for_cause_effect_classification": 51.4667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 20.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 68.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 37.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_textual_entailment": 24.3333, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 52.5952, "eval_f1_for_answerability_classification": 68.0, "eval_f1_for_cause_effect_classification": 55.0366, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.4279, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 73.2258, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 35.8708, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task396_persianqa_answerability_classification": 68.0, "eval_f1_for_task463_pasinlu_textual_entailment": 37.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.3083, "eval_f1_for_task534_farstail_textual_entailment": 35.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_f1_for_textual_entailment": 32.7694, "eval_f1_for_title_generation": 23.4279, "eval_gen_len": 4.2037, "eval_global_step": 4500, "eval_loss": 0.44648101925849915, "eval_rouge1": 49.2638, "eval_rouge1_for_answerability_classification": 68.0, "eval_rouge1_for_cause_effect_classification": 52.5205, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.95, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 73.343, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.2724, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 68.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 37.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.6667, "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_textual_entailment": 24.5556, "eval_rouge1_for_title_generation": 6.95, "eval_rougeL": 49.2509, "eval_rougeL_for_answerability_classification": 68.0, "eval_rougeL_for_cause_effect_classification": 52.5138, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.7, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 73.343, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.0724, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 68.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 37.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.6667, "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_textual_entailment": 24.5556, "eval_rougeL_for_title_generation": 6.7, "eval_runtime": 56.8208, "eval_samples_per_second": 61.597, "eval_steps_per_second": 0.968, "step": 4500 }, { "epoch": 0.66, "learning_rate": 5e-05, "loss": 1.3219, "step": 5000 }, { "epoch": 0.66, "eval_exact_match": 45.7143, "eval_exact_match_for_answerability_classification": 50.0, "eval_exact_match_for_cause_effect_classification": 49.6667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 22.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 50.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 31.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 27.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_textual_entailment": 19.6667, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 50.1301, "eval_f1_for_answerability_classification": 50.0, "eval_f1_for_cause_effect_classification": 53.2505, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.1179, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.5094, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 36.0067, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task396_persianqa_answerability_classification": 50.0, "eval_f1_for_task463_pasinlu_textual_entailment": 31.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.9195, "eval_f1_for_task534_farstail_textual_entailment": 27.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_f1_for_textual_entailment": 28.6398, "eval_f1_for_title_generation": 21.1179, "eval_gen_len": 4.4071, "eval_global_step": 5000, "eval_loss": 0.5046093463897705, "eval_rouge1": 46.8082, "eval_rouge1_for_answerability_classification": 50.0, "eval_rouge1_for_cause_effect_classification": 50.7351, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.7333, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.4986, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 35.5551, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 50.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 31.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 27.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_textual_entailment": 19.8333, "eval_rouge1_for_title_generation": 6.7333, "eval_rougeL": 46.8025, "eval_rougeL_for_answerability_classification": 50.0, "eval_rougeL_for_cause_effect_classification": 50.7285, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.7333, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.2986, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 51.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 35.5551, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 50.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 31.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 27.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_textual_entailment": 19.8333, "eval_rougeL_for_title_generation": 6.7333, "eval_runtime": 52.9633, "eval_samples_per_second": 66.084, "eval_steps_per_second": 1.038, "step": 5000 }, { "epoch": 0.73, "learning_rate": 5e-05, "loss": 1.2949, "step": 5500 }, { "epoch": 0.73, "eval_exact_match": 47.8, "eval_exact_match_for_answerability_classification": 57.0, "eval_exact_match_for_cause_effect_classification": 51.2333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 49.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 32.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 45.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_textual_entailment": 26.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 52.1079, "eval_f1_for_answerability_classification": 57.0, "eval_f1_for_cause_effect_classification": 54.6733, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.96, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.4703, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.7293, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_f1_for_task396_persianqa_answerability_classification": 57.0, "eval_f1_for_task463_pasinlu_textual_entailment": 32.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.6166, "eval_f1_for_task534_farstail_textual_entailment": 45.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_f1_for_textual_entailment": 34.8722, "eval_f1_for_title_generation": 21.96, "eval_gen_len": 4.344, "eval_global_step": 5500, "eval_loss": 0.5085814595222473, "eval_rouge1": 48.773, "eval_rouge1_for_answerability_classification": 57.0, "eval_rouge1_for_cause_effect_classification": 52.1813, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.6167, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.3426, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.0955, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 32.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 45.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_textual_entailment": 26.0, "eval_rouge1_for_title_generation": 6.6167, "eval_rougeL": 48.773, "eval_rougeL_for_answerability_classification": 57.0, "eval_rougeL_for_cause_effect_classification": 52.1813, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 65.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.6167, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.3426, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.0955, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 32.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 45.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_textual_entailment": 26.0, "eval_rougeL_for_title_generation": 6.6167, "eval_runtime": 54.0521, "eval_samples_per_second": 64.752, "eval_steps_per_second": 1.018, "step": 5500 }, { "epoch": 0.8, "learning_rate": 5e-05, "loss": 1.3032, "step": 6000 }, { "epoch": 0.8, "eval_exact_match": 48.0286, "eval_exact_match_for_answerability_classification": 52.0, "eval_exact_match_for_cause_effect_classification": 51.6667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 66.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 46.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 17.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 52.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 35.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_textual_entailment": 26.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 52.5448, "eval_f1_for_answerability_classification": 52.0, "eval_f1_for_cause_effect_classification": 55.2346, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 66.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.2404, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.1301, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 46.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 34.407, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_f1_for_task396_persianqa_answerability_classification": 52.0, "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.7902, "eval_f1_for_task534_farstail_textual_entailment": 35.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 79.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_f1_for_textual_entailment": 34.9301, "eval_f1_for_title_generation": 25.2404, "eval_gen_len": 4.1863, "eval_global_step": 6000, "eval_loss": 0.49761494994163513, "eval_rouge1": 49.2271, "eval_rouge1_for_answerability_classification": 52.0, "eval_rouge1_for_cause_effect_classification": 52.829, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 66.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.0778, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.6839, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 46.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 34.1859, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 52.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, "eval_rouge1_for_task534_farstail_textual_entailment": 35.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_textual_entailment": 26.3333, "eval_rouge1_for_title_generation": 7.0778, "eval_rougeL": 49.2156, "eval_rougeL_for_answerability_classification": 52.0, "eval_rougeL_for_cause_effect_classification": 52.8157, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 66.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.0778, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.4839, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 46.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 33.9859, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 55.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 52.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, "eval_rougeL_for_task534_farstail_textual_entailment": 35.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_textual_entailment": 26.3333, "eval_rougeL_for_title_generation": 7.0778, "eval_runtime": 48.9982, "eval_samples_per_second": 71.431, "eval_steps_per_second": 1.122, "step": 6000 }, { "epoch": 0.86, "learning_rate": 5e-05, "loss": 1.3026, "step": 6500 }, { "epoch": 0.86, "eval_exact_match": 47.2857, "eval_exact_match_for_answerability_classification": 63.0, "eval_exact_match_for_cause_effect_classification": 50.2333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 23.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 63.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 48.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_textual_entailment": 27.6667, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 51.8128, "eval_f1_for_answerability_classification": 63.0, "eval_f1_for_cause_effect_classification": 53.8076, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 26.241, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.4594, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.7673, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task396_persianqa_answerability_classification": 63.0, "eval_f1_for_task463_pasinlu_textual_entailment": 48.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.9787, "eval_f1_for_task534_farstail_textual_entailment": 34.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 49.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_f1_for_textual_entailment": 36.6596, "eval_f1_for_title_generation": 26.241, "eval_gen_len": 4.2337, "eval_global_step": 6500, "eval_loss": 0.4878259003162384, "eval_rouge1": 48.4413, "eval_rouge1_for_answerability_classification": 63.0, "eval_rouge1_for_cause_effect_classification": 51.2755, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.1803, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.0246, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 38.2396, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 63.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 48.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_textual_entailment": 28.0, "eval_rouge1_for_title_generation": 10.1803, "eval_rougeL": 48.4084, "eval_rougeL_for_answerability_classification": 63.0, "eval_rougeL_for_cause_effect_classification": 51.2621, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.4303, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.8246, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 38.0396, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 63.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 48.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_textual_entailment": 28.0, "eval_rougeL_for_title_generation": 9.4303, "eval_runtime": 55.9532, "eval_samples_per_second": 62.552, "eval_steps_per_second": 0.983, "step": 6500 }, { "epoch": 0.93, "learning_rate": 5e-05, "loss": 1.3001, "step": 7000 }, { "epoch": 0.93, "eval_exact_match": 48.4, "eval_exact_match_for_answerability_classification": 59.0, "eval_exact_match_for_cause_effect_classification": 52.1333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 28.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 59.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 34.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_textual_entailment": 22.6667, "eval_exact_match_for_title_generation": 3.0, "eval_f1": 52.9111, "eval_f1_for_answerability_classification": 59.0, "eval_f1_for_cause_effect_classification": 55.7378, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.1245, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 71.3489, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 43.7847, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_f1_for_task396_persianqa_answerability_classification": 59.0, "eval_f1_for_task463_pasinlu_textual_entailment": 34.0, "eval_f1_for_task464_pasinlu_textual_entailment": 28.6292, "eval_f1_for_task534_farstail_textual_entailment": 33.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 57.0, "eval_f1_for_textual_entailment": 31.8764, "eval_f1_for_title_generation": 25.1245, "eval_gen_len": 4.2043, "eval_global_step": 7000, "eval_loss": 0.502213180065155, "eval_rouge1": 49.4586, "eval_rouge1_for_answerability_classification": 59.0, "eval_rouge1_for_cause_effect_classification": 53.215, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.6, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 71.0823, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.367, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 59.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 34.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_textual_entailment": 22.6667, "eval_rouge1_for_title_generation": 7.6, "eval_rougeL": 49.4471, "eval_rougeL_for_answerability_classification": 59.0, "eval_rougeL_for_cause_effect_classification": 53.2016, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.6, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.8823, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 43.167, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 59.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 34.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_textual_entailment": 22.6667, "eval_rougeL_for_title_generation": 7.6, "eval_runtime": 52.3007, "eval_samples_per_second": 66.921, "eval_steps_per_second": 1.052, "step": 7000 }, { "epoch": 1.0, "learning_rate": 5e-05, "loss": 1.2703, "step": 7500 }, { "epoch": 1.0, "eval_exact_match": 45.5429, "eval_exact_match_for_answerability_classification": 57.0, "eval_exact_match_for_cause_effect_classification": 49.9333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 24.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 35.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 3.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_textual_entailment": 12.6667, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 50.0887, "eval_f1_for_answerability_classification": 57.0, "eval_f1_for_cause_effect_classification": 53.5186, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 25.1866, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.9928, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 38.5649, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task396_persianqa_answerability_classification": 57.0, "eval_f1_for_task463_pasinlu_textual_entailment": 35.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.361, "eval_f1_for_task534_farstail_textual_entailment": 3.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_f1_for_textual_entailment": 21.787, "eval_f1_for_title_generation": 25.1866, "eval_gen_len": 4.4051, "eval_global_step": 7500, "eval_loss": 0.5247823596000671, "eval_rouge1": 46.6911, "eval_rouge1_for_answerability_classification": 57.0, "eval_rouge1_for_cause_effect_classification": 50.9887, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 8.5273, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 64.7567, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 37.9049, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 35.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 3.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_textual_entailment": 13.0, "eval_rouge1_for_title_generation": 8.5273, "eval_rougeL": 46.6725, "eval_rougeL_for_answerability_classification": 57.0, "eval_rougeL_for_cause_effect_classification": 50.9754, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 8.2773, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 64.5567, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 37.7049, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 35.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 3.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_textual_entailment": 13.0, "eval_rougeL_for_title_generation": 8.2773, "eval_runtime": 53.4229, "eval_samples_per_second": 65.515, "eval_steps_per_second": 1.03, "step": 7500 }, { "epoch": 1.06, "learning_rate": 5e-05, "loss": 1.0752, "step": 8000 }, { "epoch": 1.06, "eval_exact_match": 49.6286, "eval_exact_match_for_answerability_classification": 64.0, "eval_exact_match_for_cause_effect_classification": 53.0667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 47.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 59.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 33.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 57.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_textual_entailment": 26.3333, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 54.0585, "eval_f1_for_answerability_classification": 64.0, "eval_f1_for_cause_effect_classification": 56.6185, "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 24.7119, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 65.9217, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.134, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 59.0, "eval_f1_for_task396_persianqa_answerability_classification": 64.0, "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.7787, "eval_f1_for_task534_farstail_textual_entailment": 33.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 57.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_f1_for_textual_entailment": 34.9262, "eval_f1_for_title_generation": 24.7119, "eval_gen_len": 4.2411, "eval_global_step": 8000, "eval_loss": 0.48732811212539673, "eval_rouge1": 50.7222, "eval_rouge1_for_answerability_classification": 64.0, "eval_rouge1_for_cause_effect_classification": 54.1718, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.1237, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 65.4976, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.6573, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 59.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 33.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 57.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_textual_entailment": 26.3333, "eval_rouge1_for_title_generation": 7.1237, "eval_rougeL": 50.7222, "eval_rougeL_for_answerability_classification": 64.0, "eval_rougeL_for_cause_effect_classification": 54.1718, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 47.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 68.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.1237, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 65.4976, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.6573, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 59.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 33.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 56.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 57.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_textual_entailment": 26.3333, "eval_rougeL_for_title_generation": 7.1237, "eval_runtime": 51.5603, "eval_samples_per_second": 67.882, "eval_steps_per_second": 1.067, "step": 8000 }, { "epoch": 1.13, "learning_rate": 5e-05, "loss": 1.0244, "step": 8500 }, { "epoch": 1.13, "eval_exact_match": 48.1143, "eval_exact_match_for_answerability_classification": 62.0, "eval_exact_match_for_cause_effect_classification": 52.2, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 40.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 23.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 33.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 23.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 48.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 48.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_textual_entailment": 18.6667, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 52.8712, "eval_f1_for_answerability_classification": 62.0, "eval_f1_for_cause_effect_classification": 56.0091, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 26.6965, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 60.2113, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.5611, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_f1_for_task396_persianqa_answerability_classification": 62.0, "eval_f1_for_task463_pasinlu_textual_entailment": 33.0, "eval_f1_for_task464_pasinlu_textual_entailment": 25.5214, "eval_f1_for_task534_farstail_textual_entailment": 23.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 74.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_f1_for_textual_entailment": 27.1738, "eval_f1_for_title_generation": 26.6965, "eval_gen_len": 4.112, "eval_global_step": 8500, "eval_loss": 0.5391484498977661, "eval_rouge1": 49.5027, "eval_rouge1_for_answerability_classification": 62.0, "eval_rouge1_for_cause_effect_classification": 53.4298, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.2, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 59.8095, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.084, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 33.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 23.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 48.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 48.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_textual_entailment": 19.1667, "eval_rouge1_for_title_generation": 10.2, "eval_rougeL": 49.5027, "eval_rougeL_for_answerability_classification": 62.0, "eval_rougeL_for_cause_effect_classification": 53.4298, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 10.2, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 59.8095, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.084, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 33.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 23.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 48.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 48.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_textual_entailment": 19.1667, "eval_rougeL_for_title_generation": 10.2, "eval_runtime": 51.3401, "eval_samples_per_second": 68.173, "eval_steps_per_second": 1.071, "step": 8500 }, { "epoch": 1.2, "learning_rate": 5e-05, "loss": 1.0551, "step": 9000 }, { "epoch": 1.2, "eval_exact_match": 48.1143, "eval_exact_match_for_answerability_classification": 71.0, "eval_exact_match_for_cause_effect_classification": 51.1667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 55.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 26.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 71.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 30.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 55.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 56.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_textual_entailment": 25.0, "eval_exact_match_for_title_generation": 3.0, "eval_f1": 52.7162, "eval_f1_for_answerability_classification": 71.0, "eval_f1_for_cause_effect_classification": 54.7681, "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 27.3639, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.3176, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 55.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.7249, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_f1_for_task396_persianqa_answerability_classification": 71.0, "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, "eval_f1_for_task464_pasinlu_textual_entailment": 28.659, "eval_f1_for_task534_farstail_textual_entailment": 30.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 55.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 56.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 52.0, "eval_f1_for_textual_entailment": 34.553, "eval_f1_for_title_generation": 27.3639, "eval_gen_len": 4.5371, "eval_global_step": 9000, "eval_loss": 0.5095714330673218, "eval_rouge1": 49.3168, "eval_rouge1_for_answerability_classification": 71.0, "eval_rouge1_for_cause_effect_classification": 52.28, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 10.1889, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.954, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 55.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.4462, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 71.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 30.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 55.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 56.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_textual_entailment": 25.5, "eval_rouge1_for_title_generation": 10.1889, "eval_rougeL": 49.3111, "eval_rougeL_for_answerability_classification": 71.0, "eval_rougeL_for_cause_effect_classification": 52.2733, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 10.1889, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.954, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 55.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.2462, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 71.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 30.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 55.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 56.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_textual_entailment": 25.5, "eval_rougeL_for_title_generation": 10.1889, "eval_runtime": 55.8217, "eval_samples_per_second": 62.7, "eval_steps_per_second": 0.985, "step": 9000 }, { "epoch": 1.26, "learning_rate": 5e-05, "loss": 1.073, "step": 9500 }, { "epoch": 1.26, "eval_exact_match": 49.2286, "eval_exact_match_for_answerability_classification": 61.0, "eval_exact_match_for_cause_effect_classification": 52.7667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 63.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 61.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 46.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 32.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 55.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_textual_entailment": 26.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 53.4079, "eval_f1_for_answerability_classification": 61.0, "eval_f1_for_cause_effect_classification": 56.0202, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 63.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.0851, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3659, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 41.7402, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_f1_for_task396_persianqa_answerability_classification": 61.0, "eval_f1_for_task463_pasinlu_textual_entailment": 46.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.5864, "eval_f1_for_task534_farstail_textual_entailment": 32.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 77.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 79.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_f1_for_textual_entailment": 34.8621, "eval_f1_for_title_generation": 23.0851, "eval_gen_len": 4.1429, "eval_global_step": 9500, "eval_loss": 0.5040011405944824, "eval_rouge1": 50.2692, "eval_rouge1_for_answerability_classification": 61.0, "eval_rouge1_for_cause_effect_classification": 53.7452, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 63.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.5667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.0282, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.3278, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 61.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 32.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 55.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_textual_entailment": 26.5, "eval_rouge1_for_title_generation": 6.5667, "eval_rougeL": 50.2635, "eval_rougeL_for_answerability_classification": 61.0, "eval_rougeL_for_cause_effect_classification": 53.7385, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 63.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.5667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 67.0282, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.1278, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 50.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 61.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 32.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 55.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_textual_entailment": 26.5, "eval_rougeL_for_title_generation": 6.5667, "eval_runtime": 50.7287, "eval_samples_per_second": 68.994, "eval_steps_per_second": 1.084, "step": 9500 }, { "epoch": 1.33, "learning_rate": 5e-05, "loss": 1.0736, "step": 10000 }, { "epoch": 1.33, "eval_exact_match": 49.7143, "eval_exact_match_for_answerability_classification": 67.0, "eval_exact_match_for_cause_effect_classification": 53.3, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 65.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 46.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 67.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 47.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 25.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 65.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_textual_entailment": 24.3333, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 54.0982, "eval_f1_for_answerability_classification": 67.0, "eval_f1_for_cause_effect_classification": 56.8652, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 65.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.1284, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 64.2905, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.1648, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task396_persianqa_answerability_classification": 67.0, "eval_f1_for_task463_pasinlu_textual_entailment": 47.0, "eval_f1_for_task464_pasinlu_textual_entailment": 25.3545, "eval_f1_for_task534_farstail_textual_entailment": 25.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 65.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 74.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 59.0, "eval_f1_for_textual_entailment": 32.4515, "eval_f1_for_title_generation": 23.1284, "eval_gen_len": 4.2194, "eval_global_step": 10000, "eval_loss": 0.5591691136360168, "eval_rouge1": 50.9114, "eval_rouge1_for_answerability_classification": 67.0, "eval_rouge1_for_cause_effect_classification": 54.3911, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 65.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 9.1667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 63.9211, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 41.8107, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 67.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 47.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 2.0, "eval_rouge1_for_task534_farstail_textual_entailment": 25.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 65.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_textual_entailment": 24.6667, "eval_rouge1_for_title_generation": 9.1667, "eval_rougeL": 50.9114, "eval_rougeL_for_answerability_classification": 67.0, "eval_rougeL_for_cause_effect_classification": 54.3911, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 65.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.1667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 63.9211, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.8107, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 67.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 47.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 2.0, "eval_rougeL_for_task534_farstail_textual_entailment": 25.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 65.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 49.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_textual_entailment": 24.6667, "eval_rougeL_for_title_generation": 9.1667, "eval_runtime": 53.0747, "eval_samples_per_second": 65.945, "eval_steps_per_second": 1.036, "step": 10000 }, { "epoch": 1.39, "learning_rate": 5e-05, "loss": 1.0635, "step": 10500 }, { "epoch": 1.39, "eval_exact_match": 49.4286, "eval_exact_match_for_answerability_classification": 60.0, "eval_exact_match_for_cause_effect_classification": 52.8, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 58.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 62.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 60.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 46.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 39.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 47.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_textual_entailment": 28.6667, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 53.8781, "eval_f1_for_answerability_classification": 60.0, "eval_f1_for_cause_effect_classification": 56.337, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.1671, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 74.3401, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 44.7686, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 62.0, "eval_f1_for_task396_persianqa_answerability_classification": 60.0, "eval_f1_for_task463_pasinlu_textual_entailment": 46.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.4562, "eval_f1_for_task534_farstail_textual_entailment": 39.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 47.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_f1_for_textual_entailment": 37.4854, "eval_f1_for_title_generation": 23.1671, "eval_gen_len": 4.2829, "eval_global_step": 10500, "eval_loss": 0.5000580549240112, "eval_rouge1": 50.5195, "eval_rouge1_for_answerability_classification": 60.0, "eval_rouge1_for_cause_effect_classification": 53.8171, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.6667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 74.2116, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 44.3028, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 62.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 60.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 39.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 47.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_textual_entailment": 28.6667, "eval_rouge1_for_title_generation": 7.6667, "eval_rougeL": 50.5195, "eval_rougeL_for_answerability_classification": 60.0, "eval_rougeL_for_cause_effect_classification": 53.8171, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.6667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 74.2116, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 44.3028, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 62.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 60.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 39.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 47.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_textual_entailment": 28.6667, "eval_rougeL_for_title_generation": 7.6667, "eval_runtime": 56.3252, "eval_samples_per_second": 62.139, "eval_steps_per_second": 0.976, "step": 10500 }, { "epoch": 1.46, "learning_rate": 5e-05, "loss": 1.0416, "step": 11000 }, { "epoch": 1.46, "eval_exact_match": 49.9714, "eval_exact_match_for_answerability_classification": 64.0, "eval_exact_match_for_cause_effect_classification": 53.5333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 70.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 63.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 41.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 36.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 48.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_textual_entailment": 26.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 54.3691, "eval_f1_for_answerability_classification": 64.0, "eval_f1_for_cause_effect_classification": 57.1392, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 70.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 63.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 20.8497, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 72.8568, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.8202, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task396_persianqa_answerability_classification": 64.0, "eval_f1_for_task463_pasinlu_textual_entailment": 41.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.8933, "eval_f1_for_task534_farstail_textual_entailment": 36.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 74.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 59.0, "eval_f1_for_textual_entailment": 34.6311, "eval_f1_for_title_generation": 20.8497, "eval_gen_len": 4.2114, "eval_global_step": 11000, "eval_loss": 0.5632901787757874, "eval_rouge1": 51.059, "eval_rouge1_for_answerability_classification": 64.0, "eval_rouge1_for_cause_effect_classification": 54.596, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 70.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 63.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 7.1857, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 72.6155, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.2633, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 41.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 36.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 48.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_textual_entailment": 26.0, "eval_rouge1_for_title_generation": 7.1857, "eval_rougeL": 51.0533, "eval_rougeL_for_answerability_classification": 64.0, "eval_rougeL_for_cause_effect_classification": 54.5893, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 70.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 63.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.1857, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 72.6155, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 42.0633, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 41.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 36.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 48.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 60.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_textual_entailment": 26.0, "eval_rougeL_for_title_generation": 7.1857, "eval_runtime": 50.6144, "eval_samples_per_second": 69.15, "eval_steps_per_second": 1.087, "step": 11000 }, { "epoch": 1.53, "learning_rate": 5e-05, "loss": 1.0416, "step": 11500 }, { "epoch": 1.53, "eval_exact_match": 47.5714, "eval_exact_match_for_answerability_classification": 76.0, "eval_exact_match_for_cause_effect_classification": 51.2333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 21.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 76.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 37.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 14.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 56.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_textual_entailment": 17.3333, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 52.1909, "eval_f1_for_answerability_classification": 76.0, "eval_f1_for_cause_effect_classification": 54.9215, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 23.6704, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 67.3374, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.3061, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_f1_for_task396_persianqa_answerability_classification": 76.0, "eval_f1_for_task463_pasinlu_textual_entailment": 37.0, "eval_f1_for_task464_pasinlu_textual_entailment": 28.3691, "eval_f1_for_task534_farstail_textual_entailment": 14.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 56.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_f1_for_textual_entailment": 26.4564, "eval_f1_for_title_generation": 23.6704, "eval_gen_len": 4.6251, "eval_global_step": 11500, "eval_loss": 0.49266964197158813, "eval_rouge1": 48.7653, "eval_rouge1_for_answerability_classification": 76.0, "eval_rouge1_for_cause_effect_classification": 52.3959, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.4111, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 67.1104, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 39.7656, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 76.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 37.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 14.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 56.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_textual_entailment": 17.5, "eval_rouge1_for_title_generation": 6.4111, "eval_rougeL": 48.7609, "eval_rougeL_for_answerability_classification": 76.0, "eval_rougeL_for_cause_effect_classification": 52.3907, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.4111, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 66.9565, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 39.7656, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 76.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 37.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 14.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 56.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_textual_entailment": 17.5, "eval_rougeL_for_title_generation": 6.4111, "eval_runtime": 55.2074, "eval_samples_per_second": 63.397, "eval_steps_per_second": 0.996, "step": 11500 }, { "epoch": 1.59, "learning_rate": 5e-05, "loss": 1.0514, "step": 12000 }, { "epoch": 1.59, "eval_exact_match": 49.5714, "eval_exact_match_for_answerability_classification": 74.0, "eval_exact_match_for_cause_effect_classification": 52.5667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 64.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 0.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 55.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 31.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 74.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 41.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 60.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_textual_entailment": 28.0, "eval_exact_match_for_title_generation": 0.0, "eval_f1": 53.9068, "eval_f1_for_answerability_classification": 74.0, "eval_f1_for_cause_effect_classification": 56.0614, "eval_f1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 64.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.0096, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.7858, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.0563, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task396_persianqa_answerability_classification": 74.0, "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, "eval_f1_for_task464_pasinlu_textual_entailment": 25.8876, "eval_f1_for_task534_farstail_textual_entailment": 41.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 60.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 57.0, "eval_f1_for_textual_entailment": 36.2959, "eval_f1_for_title_generation": 22.0096, "eval_gen_len": 4.0271, "eval_global_step": 12000, "eval_loss": 0.47120869159698486, "eval_rouge1": 50.6592, "eval_rouge1_for_answerability_classification": 74.0, "eval_rouge1_for_cause_effect_classification": 53.5865, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 64.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.9778, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.6986, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 45.8955, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 74.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 41.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 60.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_textual_entailment": 28.1667, "eval_rouge1_for_title_generation": 6.9778, "eval_rougeL": 50.6535, "eval_rougeL_for_answerability_classification": 74.0, "eval_rougeL_for_cause_effect_classification": 53.5798, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 64.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.9778, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.6986, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 49.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.6955, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 74.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 41.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 60.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_textual_entailment": 28.1667, "eval_rougeL_for_title_generation": 6.9778, "eval_runtime": 49.3521, "eval_samples_per_second": 70.919, "eval_steps_per_second": 1.114, "step": 12000 }, { "epoch": 1.66, "learning_rate": 5e-05, "loss": 1.0451, "step": 12500 }, { "epoch": 1.66, "eval_exact_match": 47.8, "eval_exact_match_for_answerability_classification": 64.0, "eval_exact_match_for_cause_effect_classification": 51.0333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 31.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 64.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 0.0, "eval_exact_match_for_task534_farstail_textual_entailment": 34.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_textual_entailment": 25.3333, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 52.3423, "eval_f1_for_answerability_classification": 64.0, "eval_f1_for_cause_effect_classification": 54.7372, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.1545, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.4465, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.6682, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task396_persianqa_answerability_classification": 64.0, "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.7129, "eval_f1_for_task534_farstail_textual_entailment": 34.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 53.0, "eval_f1_for_textual_entailment": 34.571, "eval_f1_for_title_generation": 22.1545, "eval_gen_len": 4.6566, "eval_global_step": 12500, "eval_loss": 0.5286997556686401, "eval_rouge1": 48.9372, "eval_rouge1_for_answerability_classification": 64.0, "eval_rouge1_for_cause_effect_classification": 52.2161, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.319, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.285, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 46.1972, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 64.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 34.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_textual_entailment": 25.6667, "eval_rouge1_for_title_generation": 5.319, "eval_rougeL": 48.9214, "eval_rougeL_for_answerability_classification": 64.0, "eval_rougeL_for_cause_effect_classification": 52.1976, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 48.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.319, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.9312, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.9972, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 64.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 34.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_textual_entailment": 25.6667, "eval_rougeL_for_title_generation": 5.319, "eval_runtime": 57.801, "eval_samples_per_second": 60.553, "eval_steps_per_second": 0.952, "step": 12500 }, { "epoch": 1.73, "learning_rate": 5e-05, "loss": 1.0371, "step": 13000 }, { "epoch": 1.73, "eval_exact_match": 48.1143, "eval_exact_match_for_answerability_classification": 62.0, "eval_exact_match_for_cause_effect_classification": 52.1333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 34.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 45.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 10.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 59.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_textual_entailment": 18.6667, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 52.5387, "eval_f1_for_answerability_classification": 62.0, "eval_f1_for_cause_effect_classification": 55.6905, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.0795, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 70.517, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 48.1994, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_f1_for_task396_persianqa_answerability_classification": 62.0, "eval_f1_for_task463_pasinlu_textual_entailment": 45.0, "eval_f1_for_task464_pasinlu_textual_entailment": 29.057, "eval_f1_for_task534_farstail_textual_entailment": 10.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 59.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_f1_for_textual_entailment": 28.019, "eval_f1_for_title_generation": 22.0795, "eval_gen_len": 4.4326, "eval_global_step": 13000, "eval_loss": 0.5131350159645081, "eval_rouge1": 49.2131, "eval_rouge1_for_answerability_classification": 62.0, "eval_rouge1_for_cause_effect_classification": 53.1587, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 9.697, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 70.1421, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 47.6192, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 45.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 10.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 59.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_textual_entailment": 18.6667, "eval_rouge1_for_title_generation": 9.697, "eval_rougeL": 49.2002, "eval_rougeL_for_answerability_classification": 62.0, "eval_rougeL_for_cause_effect_classification": 53.152, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 9.447, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 70.1421, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 52.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 47.4192, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 54.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 45.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 10.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 59.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 59.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_textual_entailment": 18.6667, "eval_rougeL_for_title_generation": 9.447, "eval_runtime": 52.3408, "eval_samples_per_second": 66.869, "eval_steps_per_second": 1.051, "step": 13000 }, { "epoch": 1.79, "learning_rate": 5e-05, "loss": 1.0494, "step": 13500 }, { "epoch": 1.79, "eval_exact_match": 48.2857, "eval_exact_match_for_answerability_classification": 58.0, "eval_exact_match_for_cause_effect_classification": 51.9, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 51.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 29.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 58.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 42.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 30.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_textual_entailment": 24.3333, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 52.5952, "eval_f1_for_answerability_classification": 58.0, "eval_f1_for_cause_effect_classification": 55.3688, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.267, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 66.5262, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 42.5375, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_f1_for_task396_persianqa_answerability_classification": 58.0, "eval_f1_for_task463_pasinlu_textual_entailment": 42.0, "eval_f1_for_task464_pasinlu_textual_entailment": 27.5012, "eval_f1_for_task534_farstail_textual_entailment": 30.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 58.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 61.0, "eval_f1_for_textual_entailment": 33.1671, "eval_f1_for_title_generation": 22.267, "eval_gen_len": 4.0611, "eval_global_step": 13500, "eval_loss": 0.5875681042671204, "eval_rouge1": 49.2211, "eval_rouge1_for_answerability_classification": 58.0, "eval_rouge1_for_cause_effect_classification": 52.8555, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.5744, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 66.5884, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 42.0767, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 58.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 42.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 30.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_textual_entailment": 24.5, "eval_rouge1_for_title_generation": 5.5744, "eval_rougeL": 49.2154, "eval_rougeL_for_answerability_classification": 58.0, "eval_rougeL_for_cause_effect_classification": 52.8488, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 54.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.5744, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 66.5884, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 41.8767, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 57.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 58.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 42.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 30.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_textual_entailment": 24.5, "eval_rougeL_for_title_generation": 5.5744, "eval_runtime": 48.6475, "eval_samples_per_second": 71.946, "eval_steps_per_second": 1.131, "step": 13500 }, { "epoch": 1.86, "learning_rate": 5e-05, "loss": 1.0335, "step": 14000 }, { "epoch": 1.86, "eval_exact_match": 49.2286, "eval_exact_match_for_answerability_classification": 62.0, "eval_exact_match_for_cause_effect_classification": 53.3333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 59.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 62.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 1.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 27.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 62.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 17.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 42.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 60.0, "eval_exact_match_for_textual_entailment": 20.0, "eval_exact_match_for_title_generation": 1.0, "eval_f1": 53.4981, "eval_f1_for_answerability_classification": 62.0, "eval_f1_for_cause_effect_classification": 56.6994, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 59.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 62.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 60.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 22.2075, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 69.3948, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 40.587, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_f1_for_task396_persianqa_answerability_classification": 62.0, "eval_f1_for_task463_pasinlu_textual_entailment": 17.0, "eval_f1_for_task464_pasinlu_textual_entailment": 28.2439, "eval_f1_for_task534_farstail_textual_entailment": 42.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 77.0, "eval_f1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 75.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 54.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 77.0, "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_f1_for_textual_entailment": 29.0813, "eval_f1_for_title_generation": 22.2075, "eval_gen_len": 4.2831, "eval_global_step": 14000, "eval_loss": 0.5322003364562988, "eval_rouge1": 50.8699, "eval_rouge1_for_answerability_classification": 62.0, "eval_rouge1_for_cause_effect_classification": 54.3127, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 59.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 62.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 5.5667, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 69.2851, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 40.0959, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 62.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 40.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 42.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rouge1_for_textual_entailment": 27.8333, "eval_rouge1_for_title_generation": 5.5667, "eval_rougeL": 50.8699, "eval_rougeL_for_answerability_classification": 62.0, "eval_rougeL_for_cause_effect_classification": 54.3127, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 59.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 62.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 5.5667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 69.2851, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 56.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 40.0959, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 60.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 62.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 40.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 42.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 58.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 54.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 60.0, "eval_rougeL_for_textual_entailment": 27.8333, "eval_rougeL_for_title_generation": 5.5667, "eval_runtime": 55.1998, "eval_samples_per_second": 63.406, "eval_steps_per_second": 0.996, "step": 14000 }, { "epoch": 1.93, "learning_rate": 5e-05, "loss": 1.0581, "step": 14500 }, { "epoch": 1.93, "eval_exact_match": 49.6857, "eval_exact_match_for_answerability_classification": 60.0, "eval_exact_match_for_cause_effect_classification": 53.9333, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 67.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 64.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 2.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 48.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 33.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 60.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 14.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 44.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 57.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 61.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 66.0, "eval_exact_match_for_textual_entailment": 19.6667, "eval_exact_match_for_title_generation": 2.0, "eval_f1": 53.6169, "eval_f1_for_answerability_classification": 60.0, "eval_f1_for_cause_effect_classification": 57.036, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 67.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 64.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 21.3724, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 63.5684, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 46.0115, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_f1_for_task396_persianqa_answerability_classification": 60.0, "eval_f1_for_task463_pasinlu_textual_entailment": 14.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.1387, "eval_f1_for_task534_farstail_textual_entailment": 44.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 78.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 80.5, "eval_f1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 76.5, "eval_f1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 66.0, "eval_f1_for_textual_entailment": 28.0462, "eval_f1_for_title_generation": 21.3724, "eval_gen_len": 4.0269, "eval_global_step": 14500, "eval_loss": 0.5212923884391785, "eval_rouge1": 51.347, "eval_rouge1_for_answerability_classification": 60.0, "eval_rouge1_for_cause_effect_classification": 54.8696, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 67.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 64.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 6.0571, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 63.5303, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 45.5583, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 60.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 40.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.0, "eval_rouge1_for_task534_farstail_textual_entailment": 44.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 57.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 61.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 66.0, "eval_rouge1_for_textual_entailment": 28.3333, "eval_rouge1_for_title_generation": 6.0571, "eval_rougeL": 51.347, "eval_rougeL_for_answerability_classification": 60.0, "eval_rougeL_for_cause_effect_classification": 54.8696, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 67.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 67.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 61.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 64.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 56.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 6.0571, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 63.5303, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 58.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 45.5583, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 53.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 60.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 40.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.0, "eval_rougeL_for_task534_farstail_textual_entailment": 44.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 57.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 61.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 50.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 66.0, "eval_rougeL_for_textual_entailment": 28.3333, "eval_rougeL_for_title_generation": 6.0571, "eval_runtime": 50.3438, "eval_samples_per_second": 69.522, "eval_steps_per_second": 1.092, "step": 14500 }, { "epoch": 1.99, "learning_rate": 5e-05, "loss": 1.0392, "step": 15000 }, { "epoch": 1.99, "eval_exact_match": 47.5429, "eval_exact_match_for_answerability_classification": 57.0, "eval_exact_match_for_cause_effect_classification": 52.2667, "eval_exact_match_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_exact_match_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_exact_match_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_exact_match_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_exact_match_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_exact_match_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_exact_match_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_exact_match_for_task1561_clickbait_news_bg_title_generation": 3.0, "eval_exact_match_for_task1626_copa_hr_cause_effect_classification": 50.0, "eval_exact_match_for_task1627_copa_hr_cause_effect_classification": 57.0, "eval_exact_match_for_task1628_copa_hr_cause_effect_classification": 30.0, "eval_exact_match_for_task1629_copa_hr_cause_effect_classification": 58.0, "eval_exact_match_for_task396_persianqa_answerability_classification": 57.0, "eval_exact_match_for_task463_pasinlu_textual_entailment": 19.0, "eval_exact_match_for_task464_pasinlu_textual_entailment": 1.0, "eval_exact_match_for_task534_farstail_textual_entailment": 16.0, "eval_exact_match_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_exact_match_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_exact_match_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_exact_match_for_task941_indicnlp_cause_effect_classification": 55.0, "eval_exact_match_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_exact_match_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_exact_match_for_task968_xcopa_cause_effect_classification": 50.0, "eval_exact_match_for_task969_xcopa_cause_effect_classification": 58.0, "eval_exact_match_for_textual_entailment": 12.0, "eval_exact_match_for_title_generation": 3.0, "eval_f1": 51.8895, "eval_f1_for_answerability_classification": 57.0, "eval_f1_for_cause_effect_classification": 55.7605, "eval_f1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_f1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_f1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_f1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_f1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_f1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_f1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_f1_for_task1561_clickbait_news_bg_title_generation": 24.7349, "eval_f1_for_task1626_copa_hr_cause_effect_classification": 68.2892, "eval_f1_for_task1627_copa_hr_cause_effect_classification": 57.0, "eval_f1_for_task1628_copa_hr_cause_effect_classification": 44.5254, "eval_f1_for_task1629_copa_hr_cause_effect_classification": 58.0, "eval_f1_for_task396_persianqa_answerability_classification": 57.0, "eval_f1_for_task463_pasinlu_textual_entailment": 19.0, "eval_f1_for_task464_pasinlu_textual_entailment": 26.5846, "eval_f1_for_task534_farstail_textual_entailment": 16.0, "eval_f1_for_task938_indicnlp_cause_effect_classification": 76.5, "eval_f1_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_f1_for_task940_indicnlp_cause_effect_classification": 76.0, "eval_f1_for_task941_indicnlp_cause_effect_classification": 55.0, "eval_f1_for_task942_indicnlp_cause_effect_classification": 75.5, "eval_f1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_f1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_f1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_f1_for_textual_entailment": 20.5282, "eval_f1_for_title_generation": 24.7349, "eval_gen_len": 4.1929, "eval_global_step": 15000, "eval_loss": 0.5555234551429749, "eval_rouge1": 49.3924, "eval_rouge1_for_answerability_classification": 57.0, "eval_rouge1_for_cause_effect_classification": 53.3372, "eval_rouge1_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rouge1_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_rouge1_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rouge1_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rouge1_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rouge1_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rouge1_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rouge1_for_task1561_clickbait_news_bg_title_generation": 8.1167, "eval_rouge1_for_task1626_copa_hr_cause_effect_classification": 68.1305, "eval_rouge1_for_task1627_copa_hr_cause_effect_classification": 57.0, "eval_rouge1_for_task1628_copa_hr_cause_effect_classification": 43.9862, "eval_rouge1_for_task1629_copa_hr_cause_effect_classification": 58.0, "eval_rouge1_for_task396_persianqa_answerability_classification": 57.0, "eval_rouge1_for_task463_pasinlu_textual_entailment": 46.0, "eval_rouge1_for_task464_pasinlu_textual_entailment": 1.5, "eval_rouge1_for_task534_farstail_textual_entailment": 16.0, "eval_rouge1_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_rouge1_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_rouge1_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_rouge1_for_task941_indicnlp_cause_effect_classification": 55.0, "eval_rouge1_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rouge1_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rouge1_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rouge1_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rouge1_for_textual_entailment": 21.1667, "eval_rouge1_for_title_generation": 8.1167, "eval_rougeL": 49.3795, "eval_rougeL_for_answerability_classification": 57.0, "eval_rougeL_for_cause_effect_classification": 53.3306, "eval_rougeL_for_task1168_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1169_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1170_xcopa_cause_effect_classification": 51.0, "eval_rougeL_for_task1171_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1172_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1173_xcopa_cause_effect_classification": 57.0, "eval_rougeL_for_task1174_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1175_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1176_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1177_xcopa_cause_effect_classification": 49.0, "eval_rougeL_for_task1178_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1179_xcopa_cause_effect_classification": 64.0, "eval_rougeL_for_task1180_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1181_xcopa_cause_effect_classification": 52.0, "eval_rougeL_for_task1182_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1183_xcopa_cause_effect_classification": 53.0, "eval_rougeL_for_task1184_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task1185_xcopa_cause_effect_classification": 55.0, "eval_rougeL_for_task1561_clickbait_news_bg_title_generation": 7.8667, "eval_rougeL_for_task1626_copa_hr_cause_effect_classification": 68.1305, "eval_rougeL_for_task1627_copa_hr_cause_effect_classification": 57.0, "eval_rougeL_for_task1628_copa_hr_cause_effect_classification": 43.7862, "eval_rougeL_for_task1629_copa_hr_cause_effect_classification": 58.0, "eval_rougeL_for_task396_persianqa_answerability_classification": 57.0, "eval_rougeL_for_task463_pasinlu_textual_entailment": 46.0, "eval_rougeL_for_task464_pasinlu_textual_entailment": 1.5, "eval_rougeL_for_task534_farstail_textual_entailment": 16.0, "eval_rougeL_for_task938_indicnlp_cause_effect_classification": 53.0, "eval_rougeL_for_task939_indicnlp_cause_effect_classification": 62.0, "eval_rougeL_for_task940_indicnlp_cause_effect_classification": 52.0, "eval_rougeL_for_task941_indicnlp_cause_effect_classification": 55.0, "eval_rougeL_for_task942_indicnlp_cause_effect_classification": 51.0, "eval_rougeL_for_task943_indicnlp_cause_effect_classification": 57.0, "eval_rougeL_for_task968_xcopa_cause_effect_classification": 50.0, "eval_rougeL_for_task969_xcopa_cause_effect_classification": 58.0, "eval_rougeL_for_textual_entailment": 21.1667, "eval_rougeL_for_title_generation": 7.8667, "eval_runtime": 48.2804, "eval_samples_per_second": 72.493, "eval_steps_per_second": 1.139, "step": 15000 }, { "epoch": 2.0, "step": 15062, "total_flos": 1.5362031529597338e+18, "train_loss": 1.2364440905811966, "train_runtime": 83936.7952, "train_samples_per_second": 2.871, "train_steps_per_second": 0.179 } ], "max_steps": 15062, "num_train_epochs": 2, "total_flos": 1.5362031529597338e+18, "trial_name": null, "trial_params": null }