March07's picture
add transferability information
683d0f6
[
{
"dataset": "cola",
"type": "task",
"origin_acc": 69.2,
"origin_prompt": "Assess the following sentence and determine if it is grammatically correct. Respond with 'Acceptable' or 'Unacceptable':",
"atk_acc": 3.6,
"atk_prompt": "sAsess the ofllowing lsentence and determine if it is grammatiaclly correct. Rspond with 'Acceptable' or 'Unacceptable':",
"transfer_ori_acc": 76.0,
"transfer_atk_acc": 75.5
},
{
"dataset": "cola",
"type": "role",
"origin_acc": 50.6,
"origin_prompt": "In the role of a syntax analyzer, examine the grammar of the provided sentence and decide if it is correct, answering with 'acceptable' for grammatically correct sentences or 'unacceptable' for incorrect ones:",
"atk_acc": 4.8,
"atk_prompt": "n the role of a syntax analyzer, examine the grammar of the provided sentence and decide if it is correct, answering with 'acceptable' for grammatically correct sentences or 'unacceptable' for incorret oKnes:",
"transfer_ori_acc": 79.0,
"transfer_atk_acc": 77.5
},
{
"dataset": "mrpc",
"type": "task",
"origin_acc": 57.84,
"origin_prompt": "Compare the following sentences and determine if they share the same semantic meaning by responding with 'equivalent' or 'not_equivalent'.",
"atk_acc": 0.0,
"atk_prompt": "oCmpare the follAwing sentewces and determine if they share the same swmantic meaning by responding with 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 74.0,
"transfer_atk_acc": 71.5
},
{
"dataset": "mrpc",
"type": "role",
"origin_acc": 52.21,
"origin_prompt": "In your capacity as a semantic comparison tool, examine the given sentences and decide if their meanings are identical, responding with 'equivalent' or 'not_equivalent'.",
"atk_acc": 1.47,
"atk_prompt": "IYn your capaciMy as a semantic comparison ool, examine the given sentences and deXide if their meanings are identRcal, rseponding with 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 75.0,
"transfer_atk_acc": 73.0
},
{
"dataset": "qnli",
"type": "task",
"origin_acc": 30.5,
"origin_prompt": "Review the given context and question, and decide if the context contains enough information to support the answer by selecting 'entailment' or 'not_entailment'.",
"atk_acc": 4.7,
"atk_prompt": "Rview the gven cnotext and question, and edcide if the context containZs enough information to Vsupport the ainswer by selecting 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 65.0,
"transfer_atk_acc": 68.5
},
{
"dataset": "qnli",
"type": "role",
"origin_acc": 35.3,
"origin_prompt": "As a language expert, assess if the given context entails the answer to the question and respond with 'entailment' or 'not_entailment'.",
"atk_acc": 2.1,
"atk_prompt": "As a language epxert, arssess if the gien contet entaxls the ansGer to the questAon and resNpond with 'entailment' or 'not_entailment'. ",
"transfer_ori_acc": 72.0,
"transfer_atk_acc": 77.5
},
{
"dataset": "qqp",
"type": "task",
"origin_acc": 24.1,
"origin_prompt": "Analyze if the given set of sentences have the same connotation by answering with 'equivalent' or 'not_equivalent'.",
"atk_acc": 2.0,
"atk_prompt": "tAnalyze if the giCen est of sentUnces have the same connotatioq by answering with 'equivalent' or 'not_equivalent'. ",
"transfer_ori_acc": 79.0,
"transfer_atk_acc": 80.0
},
{
"dataset": "qqp",
"type": "role",
"origin_acc": 16.9,
"origin_prompt": "In the role of a question similarity analyzer, examine the meaning of the provided questions and decide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for different questions.",
"atk_acc": 0.7,
"atk_prompt": "IZn the role of a questoion similarity naalyzer, examin the meJaning of the provided questions and Uecide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for dSfferent questioXns. ",
"transfer_ori_acc": 81.5,
"transfer_atk_acc": 81.0
},
{
"dataset": "rte",
"type": "task",
"origin_acc": 41.16,
"origin_prompt": "Determine if the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment'.",
"atk_acc": 1.08,
"atk_prompt": "DetermiCne if the givePn pir of sentcnces disWlays entailment or not_entailment. Rtspond with 'entailment' or 'not_entailment'.",
"transfer_ori_acc": 82.5,
"transfer_atk_acc": 81.0
},
{
"dataset": "rte",
"type": "role",
"origin_acc": 49.82,
"origin_prompt": "Working as an entailment classifier, identify whether the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment':",
"atk_acc": 1.08,
"atk_prompt": "orking as an entailment clasifier, idenStify whethre the givec ptair of sentInces displays entailment or not_entailment. ReKspond with 'entailment' or 'not_entailment':",
"transfer_ori_acc": 81.0,
"transfer_atk_acc": 78.5
},
{
"dataset": "sst2",
"type": "task",
"origin_acc": 48.05,
"origin_prompt": "After examining the following expression, label its emotion as either 'positive' or 'negative':",
"atk_acc": 0.8,
"atk_prompt": "kfter eximining the followinM expression, labe its emolion as egther 'positive' or 'negative': ",
"transfer_ori_acc": 90.0,
"transfer_atk_acc": 86.5
},
{
"dataset": "sst2",
"type": "role",
"origin_acc": 41.06,
"origin_prompt": "Functioning as a sentiment identification tool, assess if the following expression is 'positive' or 'negative'. Classify:",
"atk_acc": 27.18,
"atk_prompt": "Functionnig as a sentiment identification tool, assess if the flolowing xepression is 'positive' or 'negative'. ClUssify: ",
"transfer_ori_acc": 92.0,
"transfer_atk_acc": 90.0
},
{
"dataset": "wnli",
"type": "task",
"origin_acc": 43.66,
"origin_prompt": "Determine if the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment'.",
"atk_acc": 0.0,
"atk_prompt": "VDetermine if the giPen Apair of setences displUays entailment or not_entailment. QRespond with 'entailment' or 'not_entailment'.",
"transfer_ori_acc": 61.97183098591549,
"transfer_atk_acc": 63.38028169014085
},
{
"dataset": "wnli",
"type": "role",
"origin_acc": 43.66,
"origin_prompt": "In your role as an entailment analysis tool, assess the relationship between the given sentences and classify it as 'entailment' or 'not_entailment':",
"atk_acc": 0.0,
"atk_prompt": "kn your rohe as an entailment analysis tool, Zassess the relationship between the gUiven saentences and clasFsify it as 'entailment' or 'not_entailment':",
"transfer_ori_acc": 52.112676056338024,
"transfer_atk_acc": 47.88732394366197
},
{
"dataset": "mmlu",
"type": "task",
"origin_acc": 25.67,
"origin_prompt": "Evaluate the multiple-choice question about {} and select the most fitting response from 'A', 'B', 'C', or 'D'.",
"atk_acc": 14.7,
"atk_prompt": "Evaluate the multple-choice question about {} and elect the most fitting respone from 'A', 'B', 'C', or 'D'. ",
"transfer_ori_acc": 57.49999999999999,
"transfer_atk_acc": 60.0
},
{
"dataset": "mmlu",
"type": "role",
"origin_acc": 25.09,
"origin_prompt": "As a knowledgeable individual in {}, provide your response to the multiple-choice question by choosing 'A', 'B', 'C', or 'D'.",
"atk_acc": 16.45,
"atk_prompt": "As a kAnowledgeable indviidual in {}, provide your ersponse to the multipole-choice quesxion by choosing 'A', 'B', 'C', or 'D'.",
"transfer_ori_acc": 60.0,
"transfer_atk_acc": 61.0
}
]