File size: 4,150 Bytes
683d0f6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
[
    {
        "dataset": "cola",
        "type": "translation",
        "origin_acc": 81.5,
        "origin_prompt": "Functioning as a grammar evaluation tool, analyze the given sentence and decide if it is grammatically correct, responding with 'acceptable' or 'unacceptable'.",
        "atk_acc": 68.5,
        "atk_prompt": "Classify the grammar of a given sentence as 'acceptable' or 'unacceptable', and judge its accuracy.",
        "transfer_ori_acc": 23.9,
        "transfer_atk_acc": 28.7
    },
    {
        "dataset": "mrpc",
        "type": "translation",
        "origin_acc": 74.5,
        "origin_prompt": "Compare the following sentences and determine if they share the same semantic meaning by responding with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 65.0,
        "atk_prompt": "Based on my experience in semantic analysis, classify the following two sentences between 'equivalent' or 'not_equivalent'.",
        "transfer_ori_acc": 62.254901960784316,
        "transfer_atk_acc": 60.5392156862745
    },
    {
        "dataset": "qnli",
        "type": "translation",
        "origin_acc": 86.0,
        "origin_prompt": "As a textual analyst, examine if the given context logically implies the answer to the question and indicate your decision with 'entailment' or 'not_entailment'.",
        "atk_acc": 71.5,
        "atk_prompt": "Check the text link to the question and answer 'entailment' or 'not_entailment', depending on your language skills.",
        "transfer_ori_acc": 31.4,
        "transfer_atk_acc": 2.0
    },
    {
        "dataset": "qqp",
        "type": "translation",
        "origin_acc": 84.0,
        "origin_prompt": "In the capacity of a question assessment system, indicate if the meaning of the provided questions is the same, responding with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 80.5,
        "atk_prompt": "By analyzing the similarity of these problems, they are divided into categories of 'equivalent' or 'not_equivalent'.",
        "transfer_ori_acc": 46.9,
        "transfer_atk_acc": 37.6
    },
    {
        "dataset": "rte",
        "type": "translation",
        "origin_acc": 84.5,
        "origin_prompt": "Does the relationship between the given sentences represent entailment or not_entailment? Respond with 'entailment' or 'not_entailment'.",
        "atk_acc": 80.0,
        "atk_prompt": "Determine whether the given sentences have a cause-effect relationship as an engagement analysis tool and categorize them as 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 46.20938628158845,
        "transfer_atk_acc": 23.465703971119133
    },
    {
        "dataset": "sst2",
        "type": "translation",
        "origin_acc": 97.5,
        "origin_prompt": "In the capacity of a sentiment classifier, decide whether the given quote is 'positive' or 'negative'.",
        "atk_acc": 68.5,
        "atk_prompt": "In the context of textual analysis, what classification is this phrase between 'positive' and 'negative'?",
        "transfer_ori_acc": 20.18348623853211,
        "transfer_atk_acc": 32.798165137614674
    },
    {
        "dataset": "wnli",
        "type": "translation",
        "origin_acc": 74.65,
        "origin_prompt": "Are the following two sentences entailment or not_entailment? Answer me with \"entailment\" or \"not_entailment\", just one word.",
        "atk_acc": 59.15,
        "atk_prompt": "Determinate the semantic connections of a given sentence and classify it as 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 33.80281690140845,
        "transfer_atk_acc": 4.225352112676056
    },
    {
        "dataset": "mmlu",
        "type": "translation",
        "origin_acc": 67.0,
        "origin_prompt": "Please respond to the multiple-choice question about {} by selecting the appropriate answer: 'A', 'B', 'C', or 'D'.",
        "atk_acc": 63.0,
        "atk_prompt": "Rate your understanding of the multiple-choice question on {}. Choose the correct answer from options 'A', 'B', 'C' or 'D'.",
        "transfer_ori_acc": 8.865248226950355,
        "transfer_atk_acc": 8.156028368794328
    }
]