File size: 3,970 Bytes
683d0f6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
[
    {
        "dataset": "cola",
        "type": "translation",
        "origin_acc": 69.0,
        "origin_prompt": "Assess the following sentence and determine if it is grammatically correct. Respond with 'Acceptable' or 'Unacceptable':",
        "atk_acc": 5.8,
        "atk_prompt": "As a tool for analyzing grammatical correctness, it categorizes the grammatical rules of the sentence as 'acceptable' or 'unacceptable'.",
        "transfer_ori_acc": 76.0,
        "transfer_atk_acc": 73.5
    },
    {
        "dataset": "mrpc",
        "type": "translation",
        "origin_acc": 67.16,
        "origin_prompt": "Are the meanings of the following pair of sentences the same? Answer with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 0.74,
        "atk_prompt": "Please determine whether the following two sentences are 'equivalent' or 'not_equivalent' according to the standard of semantic comparison.",
        "transfer_ori_acc": 73.0,
        "transfer_atk_acc": 73.0
    },
    {
        "dataset": "qnli",
        "type": "translation",
        "origin_acc": 38.4,
        "origin_prompt": "As a textual inference expert, analyze if the answer to the question can be deduced from the provided context and select 'entailment' or 'not_entailment'.",
        "atk_acc": 2.4,
        "atk_prompt": "Determine whether the information provided in the context necessarily leads to the answer to the question asked and indicate 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 80.0,
        "transfer_atk_acc": 68.5
    },
    {
        "dataset": "qqp",
        "type": "translation",
        "origin_acc": 30.0,
        "origin_prompt": "Please indicate if the following pair of sentences share the same meaning by responding with 'equivalent' or 'not_equivalent'.",
        "atk_acc": 0.5,
        "atk_prompt": "Work on text sorting tasks labeled 'equivalent' or 'not_equivalent'.",
        "transfer_ori_acc": 81.5,
        "transfer_atk_acc": 56.49999999999999
    },
    {
        "dataset": "rte",
        "type": "translation",
        "origin_acc": 51.26,
        "origin_prompt": "In the role of a semantic relationship analyzer, examine the connection between the given sentences and decide if they exhibit entailment or not_entailment. Answer with 'entailment' or 'not_entailment':",
        "atk_acc": 5.42,
        "atk_prompt": "Classify it as 'entailment' or 'not_entailment' based on the content of the sentence.",
        "transfer_ori_acc": 81.5,
        "transfer_atk_acc": 78.0
    },
    {
        "dataset": "sst2",
        "type": "translation",
        "origin_acc": 53.9,
        "origin_prompt": "Please identify the emotional tone of this passage: 'positive' or 'negative'?",
        "atk_acc": 9.29,
        "atk_prompt": "Please rate the emotion of this sentence and classify it as 'positive' or 'negative'.",
        "transfer_ori_acc": 90.5,
        "transfer_atk_acc": 83.0
    },
    {
        "dataset": "wnli",
        "type": "translation",
        "origin_acc": 43.66,
        "origin_prompt": "Does the relationship between the given sentences represent entailment or not_entailment? Respond with 'entailment' or 'not_entailment'.",
        "atk_acc": 5.63,
        "atk_prompt": "Determine whether the given sentences have a cause-effect relationship as an engagement analysis tool and categorize them as 'entailment' or 'not_entailment'.",
        "transfer_ori_acc": 59.154929577464785,
        "transfer_atk_acc": 38.028169014084504
    },
    {
        "dataset": "mmlu",
        "type": "translation",
        "origin_acc": 27.07,
        "origin_prompt": "For each multiple-choice question about {}, identify the correct answer by selecting 'A', 'B', 'C', or 'D'.",
        "atk_acc": 18.09,
        "atk_prompt": "For the multiple choice problem about, choose the correct answer for '{}' from 'A', 'B', 'C', or 'D'.",
        "transfer_ori_acc": 59.5,
        "transfer_atk_acc": 53.5
    }
]