File size: 8,700 Bytes
683d0f6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
[
    {
        "dataset": "cola",
        "type": "task",
        "origin_acc": 69.2,
        "origin_prompt": "Assess the following sentence and determine if it is grammatically correct. Respond with 'Acceptable' or 'Unacceptable':",
        "atk_acc": 3.6,
        "atk_prompt": "sAsess the ofllowing lsentence and determine if it is grammatiaclly correct. Rspond with 'Acceptable' or 'Unacceptable':",
        "transfer_ori_acc": 78.0,
        "transfer_atk_acc": 73.7
    },
    {
        "dataset": "cola",
        "type": "role",
        "origin_acc": 50.6,
        "origin_prompt": "In the role of a syntax analyzer, examine the grammar of the provided sentence and decide if it is correct, answering with 'acceptable' for grammatically correct sentences or 'unacceptable' for incorrect ones:",
        "atk_acc": 4.8,
        "atk_prompt": "n the role of a syntax analyzer, examine the grammar of the provided sentence and decide if it is correct, answering with 'acceptable' for grammatically correct sentences or 'unacceptable' for incorret oKnes:",
        "transfer_ori_acc": 74.9,
        "transfer_atk_acc": 73.6
    },
    {
        "dataset": "mrpc",
        "type": "task",
        "origin_acc": 57.84,
        "origin_prompt": "Compare the following sentences and determine if they share the same semantic meaning by responding with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 0.0,
        "atk_prompt": "oCmpare the follAwing sentewces and determine if they share the same swmantic meaning by responding with 'equivalent' or 'not_equivalent'. ",
        "transfer_ori_acc": 82.1078431372549,
        "transfer_atk_acc": 81.61764705882352
    },
    {
        "dataset": "mrpc",
        "type": "role",
        "origin_acc": 52.21,
        "origin_prompt": "In your capacity as a semantic comparison tool, examine the given sentences and decide if their meanings are identical, responding with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 1.47,
        "atk_prompt": "IYn your capaciMy as a semantic comparison ool, examine the given sentences and deXide if their meanings are identRcal, rseponding with 'equivalent' or 'not_equivalent'. ",
        "transfer_ori_acc": 83.33333333333334,
        "transfer_atk_acc": 80.3921568627451
    },
    {
        "dataset": "qnli",
        "type": "task",
        "origin_acc": 30.5,
        "origin_prompt": "Review the given context and question, and decide if the context contains enough information to support the answer by selecting 'entailment' or 'not_entailment'.",
        "atk_acc": 4.7,
        "atk_prompt": "Rview the gven cnotext and question, and edcide if the context containZs enough information to Vsupport the ainswer by selecting 'entailment' or 'not_entailment'. ",
        "transfer_ori_acc": 85.2,
        "transfer_atk_acc": 88.1
    },
    {
        "dataset": "qnli",
        "type": "role",
        "origin_acc": 35.3,
        "origin_prompt": "As a language expert, assess if the given context entails the answer to the question and respond with 'entailment' or 'not_entailment'.",
        "atk_acc": 2.1,
        "atk_prompt": "As a language epxert, arssess if the gien contet entaxls the ansGer to the questAon and resNpond with 'entailment' or 'not_entailment'. ",
        "transfer_ori_acc": 88.4,
        "transfer_atk_acc": 40.400000000000006
    },
    {
        "dataset": "qqp",
        "type": "task",
        "origin_acc": 24.1,
        "origin_prompt": "Analyze if the given set of sentences have the same connotation by answering with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 2.0,
        "atk_prompt": "tAnalyze if the giCen est of sentUnces have the same connotatioq by answering with 'equivalent' or 'not_equivalent'. ",
        "transfer_ori_acc": 85.0,
        "transfer_atk_acc": 83.0
    },
    {
        "dataset": "qqp",
        "type": "role",
        "origin_acc": 16.9,
        "origin_prompt": "In the role of a question similarity analyzer, examine the meaning of the provided questions and decide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for different questions.",
        "atk_acc": 0.7,
        "atk_prompt": "IZn the role of a questoion similarity naalyzer, examin the meJaning of the provided questions and Uecide if they are equivalent, answering with 'equivalent' for equivalent questions or 'not_equivalent' for dSfferent questioXns. ",
        "transfer_ori_acc": 87.1,
        "transfer_atk_acc": 86.5
    },
    {
        "dataset": "rte",
        "type": "task",
        "origin_acc": 41.16,
        "origin_prompt": "Determine if the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment'.",
        "atk_acc": 1.08,
        "atk_prompt": "DetermiCne if the givePn pir of sentcnces disWlays entailment or not_entailment. Rtspond with 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 84.11552346570397,
        "transfer_atk_acc": 83.39350180505414
    },
    {
        "dataset": "rte",
        "type": "role",
        "origin_acc": 49.82,
        "origin_prompt": "Working as an entailment classifier, identify whether the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment':",
        "atk_acc": 1.08,
        "atk_prompt": "orking as an entailment clasifier, idenStify whethre the givec ptair of sentInces displays entailment or not_entailment. ReKspond with 'entailment' or 'not_entailment':",
        "transfer_ori_acc": 83.03249097472924,
        "transfer_atk_acc": 83.75451263537906
    },
    {
        "dataset": "sst2",
        "type": "task",
        "origin_acc": 48.05,
        "origin_prompt": "After examining the following expression, label its emotion as either 'positive' or 'negative':",
        "atk_acc": 0.8,
        "atk_prompt": "kfter eximining the followinM expression, labe its emolion as egther 'positive' or 'negative': ",
        "transfer_ori_acc": 93.23394495412845,
        "transfer_atk_acc": 92.88990825688074
    },
    {
        "dataset": "sst2",
        "type": "role",
        "origin_acc": 41.06,
        "origin_prompt": "Functioning as a sentiment identification tool, assess if the following expression is 'positive' or 'negative'. Classify:",
        "atk_acc": 27.18,
        "atk_prompt": "Functionnig as a sentiment identification tool, assess if the flolowing xepression is 'positive' or 'negative'. ClUssify: ",
        "transfer_ori_acc": 94.83944954128441,
        "transfer_atk_acc": 93.46330275229357
    },
    {
        "dataset": "wnli",
        "type": "task",
        "origin_acc": 43.66,
        "origin_prompt": "Determine if the given pair of sentences displays entailment or not_entailment. Respond with 'entailment' or 'not_entailment'.",
        "atk_acc": 0.0,
        "atk_prompt": "VDetermine if the giPen Apair of setences displUays entailment or not_entailment. QRespond with 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 61.97183098591549,
        "transfer_atk_acc": 64.7887323943662
    },
    {
        "dataset": "wnli",
        "type": "role",
        "origin_acc": 43.66,
        "origin_prompt": "In your role as an entailment analysis tool, assess the relationship between the given sentences and classify it as 'entailment' or 'not_entailment':",
        "atk_acc": 0.0,
        "atk_prompt": "kn your rohe as an entailment analysis tool, Zassess the relationship between the gUiven saentences and clasFsify it as 'entailment' or 'not_entailment':",
        "transfer_ori_acc": 56.33802816901409,
        "transfer_atk_acc": 60.56338028169014
    },
    {
        "dataset": "mmlu",
        "type": "task",
        "origin_acc": 25.67,
        "origin_prompt": "Evaluate the multiple-choice question about {} and select the most fitting response from 'A', 'B', 'C', or 'D'.",
        "atk_acc": 14.7,
        "atk_prompt": "Evaluate the multple-choice question about {} and elect the most fitting respone from 'A', 'B', 'C', or 'D'. ",
        "transfer_ori_acc": 44.50354609929078,
        "transfer_atk_acc": 44.32624113475177
    },
    {
        "dataset": "mmlu",
        "type": "role",
        "origin_acc": 25.09,
        "origin_prompt": "As a knowledgeable individual in {}, provide your response to the multiple-choice question by choosing 'A', 'B', 'C', or 'D'.",
        "atk_acc": 16.45,
        "atk_prompt": "As a kAnowledgeable indviidual in {}, provide your ersponse to the multipole-choice quesxion by choosing 'A', 'B', 'C', or 'D'.",
        "transfer_ori_acc": 44.50354609929078,
        "transfer_atk_acc": 44.680851063829785
    }
]