Miaoran commited on
Commit
b17f672
1 Parent(s): 6ad43c9

Upload 2 files

Browse files
Files changed (2) hide show
  1. eval_results.log +96 -0
  2. mcse.pt +3 -0
eval_results.log ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2021-10-03 08:30:09,513 : ***** Transfer task : STS12 *****
2
+
3
+
4
+ 2021-10-03 08:30:12,822 : MSRpar : pearson = 0.6552, spearman = 0.6487, align_loss = 0.2364, uniform_loss = -2.7071
5
+ 2021-10-03 08:30:14,166 : MSRvid : pearson = 0.8936, spearman = 0.8875, align_loss = 0.2080, uniform_loss = -2.4933
6
+ 2021-10-03 08:30:15,306 : SMTeuroparl : pearson = 0.4988, spearman = 0.5867, align_loss = 0.2905, uniform_loss = -1.7737
7
+ 2021-10-03 08:30:17,420 : surprise.OnWN : pearson = 0.7522, spearman = 0.6933, align_loss = 0.2701, uniform_loss = -2.5032
8
+ 2021-10-03 08:30:18,534 : surprise.SMTnews : pearson = 0.6894, spearman = 0.5845, align_loss = 0.2694, uniform_loss = -1.9022
9
+ 2021-10-03 08:30:18,548 : ALL : Pearson = 0.8190, Spearman = 0.7163, align_loss = 0.2510, uniform_loss = -2.3433
10
+ 2021-10-03 08:30:18,548 : ALL (weighted average) : Pearson = 0.7174, Spearman = 0.6997, align_loss = 0.2499, uniform_loss = -2.3651
11
+ 2021-10-03 08:30:18,548 : ALL (average) : Pearson = 0.6978, Spearman = 0.6802, align_loss = 0.2549, uniform_loss = -2.2759
12
+
13
+ 2021-10-03 08:30:18,555 : ***** Transfer task : STS13 (-SMT) *****
14
+
15
+
16
+ 2021-10-03 08:30:19,558 : FNWN : pearson = 0.6301, spearman = 0.6294, align_loss = 0.3905, uniform_loss = -2.2757
17
+ 2021-10-03 08:30:21,091 : headlines : pearson = 0.8155, spearman = 0.8165, align_loss = 0.2408, uniform_loss = -2.5272
18
+ 2021-10-03 08:30:22,268 : OnWN : pearson = 0.8329, spearman = 0.8242, align_loss = 0.2874, uniform_loss = -2.2479
19
+ 2021-10-03 08:30:22,272 : ALL : Pearson = 0.8145, Spearman = 0.8213, align_loss = 0.2817, uniform_loss = -2.3811
20
+ 2021-10-03 08:30:22,272 : ALL (weighted average) : Pearson = 0.7987, Spearman = 0.7958, align_loss = 0.2771, uniform_loss = -2.3911
21
+ 2021-10-03 08:30:22,272 : ALL (average) : Pearson = 0.7595, Spearman = 0.7567, align_loss = 0.3062, uniform_loss = -2.3503
22
+
23
+ 2021-10-03 08:30:22,274 : ***** Transfer task : STS14 *****
24
+
25
+
26
+ 2021-10-03 08:30:23,499 : deft-forum : pearson = 0.5769, spearman = 0.5598, align_loss = 0.3282, uniform_loss = -2.5534
27
+ 2021-10-03 08:30:24,679 : deft-news : pearson = 0.8023, spearman = 0.7736, align_loss = 0.1958, uniform_loss = -2.4303
28
+ 2021-10-03 08:30:26,339 : headlines : pearson = 0.7991, spearman = 0.7902, align_loss = 0.2404, uniform_loss = -2.5019
29
+ 2021-10-03 08:30:27,948 : images : pearson = 0.8699, spearman = 0.8319, align_loss = 0.2295, uniform_loss = -2.6572
30
+ 2021-10-03 08:30:29,636 : OnWN : pearson = 0.8668, spearman = 0.8523, align_loss = 0.2953, uniform_loss = -2.3135
31
+ 2021-10-03 08:30:31,795 : tweet-news : pearson = 0.7786, spearman = 0.6952, align_loss = 0.4321, uniform_loss = -2.4954
32
+ 2021-10-03 08:30:31,808 : ALL : Pearson = 0.7931, Spearman = 0.7594, align_loss = 0.2930, uniform_loss = -2.4940
33
+ 2021-10-03 08:30:31,808 : ALL (weighted average) : Pearson = 0.7963, Spearman = 0.7630, align_loss = 0.2945, uniform_loss = -2.4944
34
+ 2021-10-03 08:30:31,808 : ALL (average) : Pearson = 0.7823, Spearman = 0.7505, align_loss = 0.2869, uniform_loss = -2.4920
35
+
36
+ 2021-10-03 08:30:31,813 : ***** Transfer task : STS15 *****
37
+
38
+
39
+ 2021-10-03 08:30:33,333 : answers-forums : pearson = 0.7507, spearman = 0.7556, align_loss = 0.5185, uniform_loss = -2.6958
40
+ 2021-10-03 08:30:35,056 : answers-students : pearson = 0.7498, spearman = 0.7557, align_loss = 0.3069, uniform_loss = -1.7109
41
+ 2021-10-03 08:30:36,623 : belief : pearson = 0.8234, spearman = 0.8440, align_loss = 0.4319, uniform_loss = -2.5455
42
+ 2021-10-03 08:30:38,401 : headlines : pearson = 0.8250, spearman = 0.8296, align_loss = 0.2501, uniform_loss = -2.5245
43
+ 2021-10-03 08:30:40,203 : images : pearson = 0.9113, spearman = 0.9161, align_loss = 0.2386, uniform_loss = -2.6473
44
+ 2021-10-03 08:30:40,208 : ALL : Pearson = 0.8383, Spearman = 0.8463, align_loss = 0.3177, uniform_loss = -2.3758
45
+ 2021-10-03 08:30:40,208 : ALL (weighted average) : Pearson = 0.8183, Spearman = 0.8253, align_loss = 0.3177, uniform_loss = -2.3758
46
+ 2021-10-03 08:30:40,208 : ALL (average) : Pearson = 0.8121, Spearman = 0.8202, align_loss = 0.3492, uniform_loss = -2.4248
47
+
48
+ 2021-10-03 08:30:40,212 : ***** Transfer task : STS16 *****
49
+
50
+
51
+ 2021-10-03 08:30:40,999 : answer-answer : pearson = 0.6759, spearman = 0.6784, align_loss = 0.3704, uniform_loss = -2.1641
52
+ 2021-10-03 08:30:41,653 : headlines : pearson = 0.8141, spearman = 0.8351, align_loss = 0.2300, uniform_loss = -2.5482
53
+ 2021-10-03 08:30:42,387 : plagiarism : pearson = 0.8314, spearman = 0.8398, align_loss = 0.2420, uniform_loss = -2.1775
54
+ 2021-10-03 08:30:43,652 : postediting : pearson = 0.8652, spearman = 0.8798, align_loss = 0.1522, uniform_loss = -2.5769
55
+ 2021-10-03 08:30:44,240 : question-question : pearson = 0.6909, spearman = 0.6944, align_loss = 0.2678, uniform_loss = -2.2807
56
+ 2021-10-03 08:30:44,243 : ALL : Pearson = 0.7664, Spearman = 0.7750, align_loss = 0.2525, uniform_loss = -2.3495
57
+ 2021-10-03 08:30:44,243 : ALL (weighted average) : Pearson = 0.7767, Spearman = 0.7868, align_loss = 0.2531, uniform_loss = -2.3528
58
+ 2021-10-03 08:30:44,243 : ALL (average) : Pearson = 0.7755, Spearman = 0.7855, align_loss = 0.2525, uniform_loss = -2.3495
59
+
60
+ 2021-10-03 08:30:44,245 :
61
+
62
+ ***** Transfer task : STSBenchmark*****
63
+
64
+
65
+ 2021-10-03 08:31:03,739 : train : pearson = 0.8231, spearman = 0.8058, align_loss = 0.2532, uniform_loss = -2.6089
66
+ 2021-10-03 08:31:09,180 : dev : pearson = 0.8537, spearman = 0.8558, align_loss = 0.2799, uniform_loss = -2.6759
67
+ 2021-10-03 08:31:13,943 : test : pearson = 0.8001, spearman = 0.7996, align_loss = 0.2558, uniform_loss = -2.5835
68
+ 2021-10-03 08:31:13,953 : ALL : Pearson = 0.8260, Spearman = 0.8164, align_loss = 0.2583, uniform_loss = -2.6166
69
+ 2021-10-03 08:31:13,954 : ALL (weighted average) : Pearson = 0.8247, Spearman = 0.8135, align_loss = 0.2582, uniform_loss = -2.6165
70
+ 2021-10-03 08:31:13,954 : ALL (average) : Pearson = 0.8256, Spearman = 0.8204, align_loss = 0.2630, uniform_loss = -2.6228
71
+
72
+ 2021-10-03 08:31:13,966 :
73
+
74
+ ***** Transfer task : SICKRelatedness*****
75
+
76
+
77
+ 2021-10-03 08:31:26,378 : train : pearson = 0.8149, spearman = 0.7307, align_loss = 0.2282, uniform_loss = -2.5580
78
+ 2021-10-03 08:31:27,937 : dev : pearson = 0.8175, spearman = 0.7571, align_loss = 0.2344, uniform_loss = -2.7867
79
+ 2021-10-03 08:31:41,491 : test : pearson = 0.8030, spearman = 0.7212, align_loss = 0.2274, uniform_loss = -2.5465
80
+ 2021-10-03 08:31:41,514 : ALL : Pearson = 0.8092, Spearman = 0.7273, align_loss = 0.2281, uniform_loss = -2.5639
81
+ 2021-10-03 08:31:41,514 : ALL (weighted average) : Pearson = 0.8091, Spearman = 0.7273, align_loss = 0.2281, uniform_loss = -2.5638
82
+ 2021-10-03 08:31:41,514 : ALL (average) : Pearson = 0.8118, Spearman = 0.7364, align_loss = 0.2300, uniform_loss = -2.6304
83
+
84
+ 2021-10-03 08:31:41,515 : ------ test ------
85
+ 2021-10-03 08:31:41,517 : +--------+--------+--------+--------+--------+--------------+-----------------+--------+
86
+ | STS12 | STS13 | STS14 | STS15 | STS16 | STSBenchmark | SICKRelatedness | Avg. |
87
+ +--------+--------+--------+--------+--------+--------------+-----------------+--------+
88
+ | 71.63 | 82.13 | 75.94 | 84.63 | 77.50 | 79.96 | 72.12 | 77.70 |
89
+ | 0.251 | 0.282 | 0.293 | 0.318 | 0.252 | 0.256 | 0.227 | 0.268 |
90
+ | -2.343 | -2.381 | -2.494 | -2.376 | -2.349 | -2.583 | -2.547 | -2.439 |
91
+ +--------+--------+--------+--------+--------+--------------+-----------------+--------+
92
+ 2021-10-03 08:31:41,518 : +------+------+------+------+------+------+------+------+
93
+ | MR | CR | SUBJ | MPQA | SST2 | TREC | MRPC | Avg. |
94
+ +------+------+------+------+------+------+------+------+
95
+ | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
96
+ +------+------+------+------+------+------+------+------+
mcse.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d19448fcdf0618d946dfca19740a6c9c79814fa6a6275ac99feb35e5897e79e
3
+ size 2887571