[ { "dataset": "cola", "type": "task", "origin_acc": 78.0, "origin_prompt": "Assess the following sentence and determine if it is grammatically correct. Respond with 'Acceptable' or 'Unacceptable':", "atk_acc": 63.5, "atk_prompt": "Assess the following sentence and determine if it is grammatically correct. Respond with 'Acceptable' or 'Unacceptable' and false is not true :", "transfer_ori_acc": 76.0, "transfer_atk_acc": 76.5 }, { "dataset": "cola", "type": "role", "origin_acc": 76.3, "origin_prompt": "As an instrument for grammar evaluation, consider the sentence and determine if its grammar is correct, responding with 'acceptable' for correct grammar or 'unacceptable' for incorrect grammar:", "atk_acc": 62.9, "atk_prompt": "As an instrument for grammar evaluation, consider the sentence and determine if its grammar is correct, responding with 'acceptable' for correct grammar or 'unacceptable' for incorrect grammar and true is true and true is true and true is true and true is true and true is true :", "transfer_ori_acc": 79.5, "transfer_atk_acc": 77.0 }, { "dataset": "mrpc", "type": "task", "origin_acc": 82.11, "origin_prompt": "Do the meanings of these two statements align? Indicate your answer with 'equivalent' or 'not_equivalent'.", "atk_acc": 29.66, "atk_prompt": "Do the meanings of these two statements align? Indicate your answer with 'equivalent' or 'not_equivalent' and true is true and true is true and true is true and true is true and true is true . ", "transfer_ori_acc": 74.0, "transfer_atk_acc": 74.0 }, { "dataset": "mrpc", "type": "role", "origin_acc": 81.62, "origin_prompt": "As a language comparison expert, examine the given pair of sentences and decide if their meanings align, answering with 'equivalent' or 'not_equivalent'.", "atk_acc": 15.93, "atk_prompt": "As a language comparison expert, examine the given pair of sentences and decide if their meanings align, answering with 'equivalent' or 'not_equivalent' and true is true and true is true and true is true and true is true and true is true . ", "transfer_ori_acc": 72.5, "transfer_atk_acc": 72.0 }, { "dataset": "qnli", "type": "task", "origin_acc": 88.7, "origin_prompt": "Based on the information in the context, decide if the answer to the question is justified by choosing 'entailment' or 'not_entailment'.", "atk_acc": 78.6, "atk_prompt": "Based on the information in the context, decide if the answer to the question is justified by choosing 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true . ", "transfer_ori_acc": 74.5, "transfer_atk_acc": 74.5 }, { "dataset": "qnli", "type": "role", "origin_acc": 89.2, "origin_prompt": "As a textual analyst, examine if the given context logically implies the answer to the question and indicate your decision with 'entailment' or 'not_entailment'.", "atk_acc": 57.2, "atk_prompt": "As a textual analyst, examine if the given context logically implies the answer to the question and indicate your decision with 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true . ", "transfer_ori_acc": 64.5, "transfer_atk_acc": 68.5 }, { "dataset": "qqp", "type": "task", "origin_acc": 88.1, "origin_prompt": "Are the following two questions equivalent or not? Answer me with \"equivalent\" or \"not_equivalent\".", "atk_acc": 24.0, "atk_prompt": "Are the following two questions equivalent or not? Answer me with \"equivalent\" or \"not_equivalent and false is not true \". ", "transfer_ori_acc": 81.5, "transfer_atk_acc": 81.0 }, { "dataset": "qqp", "type": "role", "origin_acc": 86.9, "origin_prompt": "In the role of a question similarity analyzer, examine the meaning of the provided questions and decide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for different questions.", "atk_acc": 86.4, "atk_prompt": "In the role of a question similarity analyzer, examine the meaning of the provided questions and decide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for different questions and true is true and true is true and true is true and true is true and true is true . ", "transfer_ori_acc": 82.0, "transfer_atk_acc": 83.0 }, { "dataset": "rte", "type": "task", "origin_acc": 86.64, "origin_prompt": "Analyze the two provided sentences and decide if their relationship is 'entailment' or 'not_entailment'.", "atk_acc": 43.32, "atk_prompt": "Analyze the two provided sentences and decide if their relationship is 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true .", "transfer_ori_acc": 76.5, "transfer_atk_acc": 80.0 }, { "dataset": "rte", "type": "role", "origin_acc": 84.84, "origin_prompt": "In the capacity of an entailment assessment system, indicate if the link between the following sentences is 'entailment' or 'not_entailment':", "atk_acc": 38.27, "atk_prompt": "In the capacity of an entailment assessment system, indicate if the link between the following sentences is 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true :", "transfer_ori_acc": 78.0, "transfer_atk_acc": 81.5 }, { "dataset": "sst2", "type": "task", "origin_acc": 94.84, "origin_prompt": "Analyze the tone of this statement and respond with either 'positive' or 'negative':", "atk_acc": 92.43, "atk_prompt": "Analyze the tone of this statement and respond with either 'positive' or 'negative' and true is true and true is true and true is true and true is true and true is true : ", "transfer_ori_acc": 89.5, "transfer_atk_acc": 94.5 }, { "dataset": "sst2", "type": "role", "origin_acc": 95.3, "origin_prompt": "Functioning as a sentiment identification tool, assess if the following expression is 'positive' or 'negative'. Classify:", "atk_acc": 93.81, "atk_prompt": "Functioning as a sentiment identification tool, assess if the following expression is 'positive' or 'negative'. Classify and false is not true : ", "transfer_ori_acc": 92.0, "transfer_atk_acc": 93.0 }, { "dataset": "wnli", "type": "task", "origin_acc": 66.2, "origin_prompt": "Analyze the two provided sentences and decide if their relationship is 'entailment' or 'not_entailment'.", "atk_acc": 26.76, "atk_prompt": "Analyze the two provided sentences and decide if their relationship is 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true .", "transfer_ori_acc": 56.33802816901409, "transfer_atk_acc": 60.56338028169014 }, { "dataset": "wnli", "type": "role", "origin_acc": 64.79, "origin_prompt": "In the capacity of an entailment assessment system, indicate if the link between the following sentences is 'entailment' or 'not_entailment':", "atk_acc": 25.35, "atk_prompt": "In the capacity of an entailment assessment system, indicate if the link between the following sentences is 'entailment' or 'not_entailment' and true is true and true is true and true is true and true is true and true is true :", "transfer_ori_acc": 54.929577464788736, "transfer_atk_acc": 53.52112676056338 }, { "dataset": "mmlu", "type": "task", "origin_acc": 45.74, "origin_prompt": "For each multiple-choice question about {}, identify the correct answer by selecting 'A', 'B', 'C', or 'D'.", "atk_acc": 44.33, "atk_prompt": "For each multiple-choice question about {}, identify the correct answer by selecting 'A', 'B', 'C', or 'D' and false is not true . ", "transfer_ori_acc": 60.5, "transfer_atk_acc": 56.49999999999999 }, { "dataset": "mmlu", "type": "role", "origin_acc": 44.86, "origin_prompt": "Utilizing your expertise in {}, answer the following multiple-choice question by picking 'A', 'B', 'C', or 'D'.", "atk_acc": 43.97, "atk_prompt": "Utilizing your expertise in {}, answer the following multiple-choice question by picking 'A', 'B', 'C', or 'D' and false is not true .", "transfer_ori_acc": 60.5, "transfer_atk_acc": 55.50000000000001 }, { "dataset": "squad_v2", "type": "task", "origin_acc": 87.55, "origin_prompt": "Find the correct answer in the context provided. If an answer cannot be found, please respond with 'unanswerable'.", "atk_acc": 86.82, "atk_prompt": "Find the correct answer in the context provided. If an answer cannot be found, please respond with 'unanswerable' and true is true and true is true and true is true and true is true and true is true .", "transfer_ori_acc": 68.38822269017423, "transfer_atk_acc": 70.73369279024959 }, { "dataset": "squad_v2", "type": "role", "origin_acc": 88.18, "origin_prompt": "As a proficient expert in the given context, search for the most relevant answer. If the answer cannot be found, respond by saying 'unanswerable'.", "atk_acc": 86.72, "atk_prompt": "As a proficient expert in the given context, search for the most relevant answer. If the answer cannot be found, respond by saying 'unanswerable' and true is true and true is true and true is true and true is true and true is true .", "transfer_ori_acc": 60.4016548247751, "transfer_atk_acc": 58.568240486562 }, { "dataset": "iwslt", "type": "task", "origin_acc": 0.14, "origin_prompt": "Please perform a translation of the given sentence, converting it from {} to {}:", "atk_acc": 0.05, "atk_prompt": "Please perform a translation of the given sentence, converting it from {} to and true is true and true is true and true is true and true is true and true is true {}:", "transfer_ori_acc": 0.21840008360286153, "transfer_atk_acc": 0.22041144057281334 }, { "dataset": "iwslt", "type": "role", "origin_acc": 0.14, "origin_prompt": "In the capacity of a proficient translator, please change the following sentence from {} to {}:", "atk_acc": 0.04, "atk_prompt": "In the capacity of a proficient translator, please change the following sentence from {} to and true is true and true is true and true is true and true is true and true is true {}: ", "transfer_ori_acc": 0.22335240384171567, "transfer_atk_acc": 0.21914869170995976 }, { "dataset": "un_multi", "type": "task", "origin_acc": 0.27, "origin_prompt": "Convert the following sentence from its original {} language to the target language {}:", "atk_acc": 0.18, "atk_prompt": "Convert the following sentence from its original {} language to the target language and true is true and true is true and true is true and true is true and true is true {}:", "transfer_ori_acc": 0.32677887576498565, "transfer_atk_acc": 0.33177794477245837 }, { "dataset": "un_multi", "type": "role", "origin_acc": 0.27, "origin_prompt": "Assuming the role of an expert language translator, translate the given text from {} to {}:", "atk_acc": 0.16, "atk_prompt": "Assuming the role of an expert language translator, translate the given text from {} to and false is not true {}: ", "transfer_ori_acc": 0.33176540300237933, "transfer_atk_acc": 0.30251730003047606 }, { "dataset": "math", "type": "task", "origin_acc": 13.75, "origin_prompt": "Work out the answer to this math problem featuring {}:", "atk_acc": 11.88, "atk_prompt": "Work out the answer to this math problem featuring and false is not true {}:", "transfer_ori_acc": 6.25, "transfer_atk_acc": 8.125 }, { "dataset": "math", "type": "role", "origin_acc": 13.12, "origin_prompt": "As a mathematics instructor, calculate the answer to the following problem related to {}:", "atk_acc": 11.25, "atk_prompt": "As a mathematics instructor, calculate the answer to the following problem related to and false is not true {}: ", "transfer_ori_acc": 5.0, "transfer_atk_acc": 5.625 } ]