Add evaluation results on the default config of xsum

#6
by autoevaluator HF staff - opened
Files changed (1) hide show
  1. README.md +66 -0
README.md CHANGED
@@ -45,6 +45,72 @@ model-index:
45
  type: gen_len
46
  value: 209.2537
47
  verified: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  ---
49
 
50
  # BigBirdPegasus model (large)
 
45
  type: gen_len
46
  value: 209.2537
47
  verified: true
48
+ - task:
49
+ type: summarization
50
+ name: Summarization
51
+ dataset:
52
+ name: cnn_dailymail
53
+ type: cnn_dailymail
54
+ config: 3.0.0
55
+ split: test
56
+ metrics:
57
+ - name: ROUGE-1
58
+ type: rouge
59
+ value: 9.0885
60
+ verified: true
61
+ - name: ROUGE-2
62
+ type: rouge
63
+ value: 1.0325
64
+ verified: true
65
+ - name: ROUGE-L
66
+ type: rouge
67
+ value: 7.3182
68
+ verified: true
69
+ - name: ROUGE-LSUM
70
+ type: rouge
71
+ value: 8.1455
72
+ verified: true
73
+ - name: loss
74
+ type: loss
75
+ value: .nan
76
+ verified: true
77
+ - name: gen_len
78
+ type: gen_len
79
+ value: 210.4762
80
+ verified: true
81
+ - task:
82
+ type: summarization
83
+ name: Summarization
84
+ dataset:
85
+ name: xsum
86
+ type: xsum
87
+ config: default
88
+ split: test
89
+ metrics:
90
+ - name: ROUGE-1
91
+ type: rouge
92
+ value: 4.9787
93
+ verified: true
94
+ - name: ROUGE-2
95
+ type: rouge
96
+ value: 0.3527
97
+ verified: true
98
+ - name: ROUGE-L
99
+ type: rouge
100
+ value: 4.3679
101
+ verified: true
102
+ - name: ROUGE-LSUM
103
+ type: rouge
104
+ value: 4.1723
105
+ verified: true
106
+ - name: loss
107
+ type: loss
108
+ value: .nan
109
+ verified: true
110
+ - name: gen_len
111
+ type: gen_len
112
+ value: 230.4886
113
+ verified: true
114
  ---
115
 
116
  # BigBirdPegasus model (large)