[
{
"dataset": "cola",
"type": "translation",
"origin_acc": 81.5,
"origin_prompt": "Functioning as a grammar evaluation tool, analyze the given sentence and decide if it is grammatically correct, responding with 'acceptable' or 'unacceptable'.",
"atk_acc": 68.5,
"atk_prompt": "Classify the grammar of a given sentence as 'acceptable' or 'unacceptable', and judge its accuracy.",
"transfer_ori_acc": 75.2,
"transfer_atk_acc": 75.8
},
{
"dataset": "mrpc",
"type": "translation",
"origin_acc": 74.5,
"origin_prompt": "Compare the following sentences and determine if they share the same semantic meaning by responding with 'equivalent' or 'not_equivalent'.",
"atk_acc": 65.0,
"atk_prompt": "Based on my experience in semantic analysis, classify the following two sentences between 'equivalent' or 'not_equivalent'.",
"transfer_ori_acc": 80.3921568627451,
"transfer_atk_acc": 81.61764705882352
},
{
"dataset": "qnli",
"type": "translation",
"origin_acc": 86.0,
"origin_prompt": "As a textual analyst, examine if the given context logically implies the answer to the question and indicate your decision with 'entailment' or 'not_entailment'.",
"atk_acc": 71.5,
"atk_prompt": "Check the text link to the question and answer 'entailment' or 'not_entailment', depending on your language skills.",
"transfer_ori_acc": 88.8,
"transfer_atk_acc": 56.699999999999996
},
{
"dataset": "qqp",
"type": "translation",
"origin_acc": 84.0,
"origin_prompt": "In the capacity of a question assessment system, indicate if the meaning of the provided questions is the same, responding with 'equivalent' or 'not_equivalent'.",
"atk_acc": 80.5,
"atk_prompt": "By analyzing the similarity of these problems, they are divided into categories of 'equivalent' or 'not_equivalent'.",
"transfer_ori_acc": 86.1,
"transfer_atk_acc": 87.5
},
{
"dataset": "rte",
"type": "translation",
"origin_acc": 84.5,
"origin_prompt": "Does the relationship between the given sentences represent entailment or not_entailment? Respond with 'entailment' or 'not_entailment'.",
"atk_acc": 80.0,
"atk_prompt": "Determine whether the given sentences have a cause-effect relationship as an engagement analysis tool and categorize them as 'entailment' or 'not_entailment'.",
"transfer_ori_acc": 83.75451263537906,
"transfer_atk_acc": 84.47653429602889
},
{
"dataset": "sst2",
"type": "translation",
"origin_acc": 97.5,
"origin_prompt": "In the capacity of a sentiment classifier, decide whether the given quote is 'positive' or 'negative'.",
"atk_acc": 68.5,
"atk_prompt": "In the context of textual analysis, what classification is this phrase between 'positive' and 'negative'?",
"transfer_ori_acc": 94.95412844036697,
"transfer_atk_acc": 94.61009174311926
},
{
"dataset": "wnli",
"type": "translation",
"origin_acc": 74.65,
"origin_prompt": "Are the following two sentences entailment or not_entailment? Answer me with \"entailment\" or \"not_entailment\", just one word.",
"atk_acc": 59.15,
"atk_prompt": "Determinate the semantic connections of a given sentence and classify it as 'entailment' or 'not_entailment'.",
"transfer_ori_acc": 67.6056338028169,
"transfer_atk_acc": 54.929577464788736
},
{
"dataset": "mmlu",
"type": "translation",
"origin_acc": 67.0,
"origin_prompt": "Please respond to the multiple-choice question about {} by selecting the appropriate answer: 'A', 'B', 'C', or 'D'.",
"atk_acc": 63.0,
"atk_prompt": "Rate your understanding of the multiple-choice question on {}. Choose the correct answer from options 'A', 'B', 'C' or 'D'.",
"transfer_ori_acc": 45.21276595744681,
"transfer_atk_acc": 45.56737588652482
},
{
"dataset": "squad_v2",
"type": "translation",
"origin_acc": 74.58,
"origin_prompt": "Please derive the most fitting answer from the context. If there isn't an answer in the context, use 'unanswerable'.",
"atk_acc": 67.46,
"atk_prompt": "Please provide additional information about the facts mentioned in this sentence. If no information is available, respond with 'unanswerable'.",
"transfer_ori_acc": 87.04992770387507,
"transfer_atk_acc": 86.92265497660236
},
{
"dataset": "iwslt",
"type": "translation",
"origin_acc": 0.24,
"origin_prompt": "Convert the following sentence from its original {} language to the target language {}.",
"atk_acc": 0.17,
"atk_prompt": "Please translate the sentences below into {}, then {}.",
"transfer_ori_acc": 0.2240211126734209,
"transfer_atk_acc": 0.20150103267232944
},
{
"dataset": "un_multi",
"type": "translation",
"origin_acc": 0.36,
"origin_prompt": "Translate the following text from the source language {} to the target language {}.",
"atk_acc": 0.25,
"atk_prompt": "Please translate the following sentences into {}, then {}.",
"transfer_ori_acc": 0.3090347352409074,
"transfer_atk_acc": 0.3050833075162871
},
{
"dataset": "math",
"type": "translation",
"origin_acc": 23.12,
"origin_prompt": "Compute the result of this math task concerning {}.",
"atk_acc": 18.75,
"atk_prompt": "Please calculate the answers related to {}.",
"transfer_ori_acc": 16.25,
"transfer_atk_acc": 16.875
}
]