March07's picture
add transferability information
683d0f6
raw
history blame
8.37 kB
[
{
"dataset": "cola",
"type": "task",
"origin_acc": 62.0,
"origin_prompt": "Assess the grammatical structure of the given sentence and classify it as 'Acceptable' or 'Unacceptable'.",
"atk_acc": 11.4,
"atk_prompt": "Assess the grammatcal etructure of the given entence and classif it as 'Acceptable' or 'Unacceptable'. ",
"transfer_ori_acc": 76.3,
"transfer_atk_acc": 77.9
},
{
"dataset": "cola",
"type": "role",
"origin_acc": 35.1,
"origin_prompt": "Working as a grammar classifier, identify whether the given sentence has correct grammar, and respond with 'acceptable' for correct sentences or 'unacceptable' for incorrect ones.",
"atk_acc": 0.0,
"atk_prompt": "Working as a grammar clsasifier, identify whether the given sentence has correct grammar, and reszond with 'acceptable' for correct sentences or 'unacceptable' for incorrect noes. ",
"transfer_ori_acc": 75.4,
"transfer_atk_acc": 74.7
},
{
"dataset": "mrpc",
"type": "task",
"origin_acc": 67.65,
"origin_prompt": "Do the meanings of these two statements align? Indicate your answer with 'equivalent' or 'not_equivalent'.",
"atk_acc": 36.76,
"atk_prompt": "Zo the meanings of these Xwo statements Ualign? IndicNte your answeY with 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 81.86274509803921,
"transfer_atk_acc": 81.61764705882352
},
{
"dataset": "mrpc",
"type": "role",
"origin_acc": 69.12,
"origin_prompt": "In your capacity as a semantic assessment tool, evaluate the provided sentences and classify their meanings as 'equivalent' or 'not_equivalent'.",
"atk_acc": 34.31,
"atk_prompt": "nI your capacitCy as a sebmantic assgssment otol, evaluate the provided sentenceAs and Zlassify their meaniPgs as 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 75.24509803921569,
"transfer_atk_acc": 79.41176470588235
},
{
"dataset": "qnli",
"type": "task",
"origin_acc": 42.7,
"origin_prompt": "Review the given context and question, and decide if the context contains enough information to support the answer by selecting 'entailment' or 'not_entailment'.",
"atk_acc": 0.2,
"atk_prompt": "RevTiew the ginen cEntext and uestion, and decid if the context conatains enough iformation to uspport the answVer by selectin 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 85.2,
"transfer_atk_acc": 69.5
},
{
"dataset": "qnli",
"type": "role",
"origin_acc": 42.9,
"origin_prompt": "As a linguistic consultant, decide if the answer to the question is logically supported by the provided context and respond with 'entailment' or 'not_entailment'.",
"atk_acc": 1.8,
"atk_prompt": "Abs a linguistic consultant, decide if the answer to the question is logically supported by the provided Aontext and respGond with 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 85.1,
"transfer_atk_acc": 88.4
},
{
"dataset": "qqp",
"type": "task",
"origin_acc": 38.1,
"origin_prompt": "Assess whether the following statements are identical in meaning by answering 'equivalent' or 'not_equivalent'.",
"atk_acc": 20.3,
"atk_prompt": "Asess hwether the following statemets are identiacl in meaning by answerinEg 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 86.9,
"transfer_atk_acc": 84.8
},
{
"dataset": "qqp",
"type": "role",
"origin_acc": 33.6,
"origin_prompt": "In your role as a question comparison tool, assess the following pair of questions and classify them as 'equivalent' or 'not_equivalent'.",
"atk_acc": 23.6,
"atk_prompt": "In your Irole as a questioGn comparison tolo, ussess the foMlowing pair of questrions and classify them as 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 85.2,
"transfer_atk_acc": 87.3
},
{
"dataset": "rte",
"type": "task",
"origin_acc": 50.54,
"origin_prompt": "Are the following two sentences entailment or not_entailment? Answer me with \"entailment\" or \"not_entailment\", just one word.",
"atk_acc": 0.36,
"atk_prompt": "Aer the following wto sentences entailment or not_entailment? Answer me with \"entailment\" or \"not_entailment\", just one wor. ",
"transfer_ori_acc": 85.5595667870036,
"transfer_atk_acc": 81.94945848375451
},
{
"dataset": "rte",
"type": "role",
"origin_acc": 36.82,
"origin_prompt": "In the role of a semantic relationship analyzer, examine the connection between the given sentences and decide if they exhibit entailment or not_entailment. Answer with 'entailment' or 'not_entailment'.",
"atk_acc": 1.08,
"atk_prompt": "In the role of a semgntic relationship anayzer, examin the connection between the given sentences and decide if they exhibit entailment or not_entailment. AnCwer with 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 81.2274368231047,
"transfer_atk_acc": 81.94945848375451
},
{
"dataset": "sst2",
"type": "task",
"origin_acc": 14.45,
"origin_prompt": "Review this statement and decide whether it has a 'positive' or 'negative' sentiment.",
"atk_acc": 0.0,
"atk_prompt": "GReview this stateent and decide wdether it has a 'positive' or 'negative' sentiment. ",
"transfer_ori_acc": 95.18348623853211,
"transfer_atk_acc": 94.95412844036697
},
{
"dataset": "sst2",
"type": "role",
"origin_acc": 26.49,
"origin_prompt": "In the role of a sentiment analysis tool, respond with 'positive' or 'negative' to classify this statement.",
"atk_acc": 0.0,
"atk_prompt": "In the ole of a senteiment naalysis tool, resond with 'positive' or 'negative' to classfy this sattement. ",
"transfer_ori_acc": 95.52752293577981,
"transfer_atk_acc": 95.52752293577981
},
{
"dataset": "wnli",
"type": "task",
"origin_acc": 23.94,
"origin_prompt": "Does the relationship between the given sentences represent entailment or not_entailment? Respond with 'entailment' or 'not_entailment'.",
"atk_acc": 0.0,
"atk_prompt": "SDoes the relationship between the given stentences represent entailment or not_entailment? ResYond with 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 63.38028169014085,
"transfer_atk_acc": 67.6056338028169
},
{
"dataset": "wnli",
"type": "role",
"origin_acc": 16.9,
"origin_prompt": "In your role as an entailment analysis tool, assess the relationship between the given sentences and classify it as 'entailment' or 'not_entailment'.",
"atk_acc": 0.0,
"atk_prompt": "mn your roye as an entailment aunalysis tooS, assess the relationship between the given sentences and classify it as 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 57.74647887323944,
"transfer_atk_acc": 61.97183098591549
},
{
"dataset": "mmlu",
"type": "task",
"origin_acc": 10.15,
"origin_prompt": "In relation to the multiple-choice question on {}, please provide the accurate answer by choosing 'A', 'B', 'C', or 'D'.",
"atk_acc": 3.5,
"atk_prompt": "oIn relatin to the mhltiple-choice question on {}, plese provide the accurate answer by choosing 'A', 'B', 'C', or 'D'. ",
"transfer_ori_acc": 46.808510638297875,
"transfer_atk_acc": 44.50354609929078
},
{
"dataset": "mmlu",
"type": "role",
"origin_acc": 9.8,
"origin_prompt": "With your knowledge of {}, tackle the following multiple-choice question by choosing 'A', 'B', 'C', or 'D'.",
"atk_acc": 6.07,
"atk_prompt": "With your knowlegde of {}, tacke the folloing mulBiple-choice question by choosing 'A', 'B', 'C', or 'D'.",
"transfer_ori_acc": 46.09929078014184,
"transfer_atk_acc": 45.0354609929078
}
]