Add evaluation results on the default config and test split of billsum

#5
by autoevaluator HF staff - opened
Files changed (1) hide show
  1. README.md +33 -0
README.md CHANGED
@@ -57,6 +57,39 @@ model-index:
57
  name: gen_len
58
  verified: true
59
  verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMWZhOGMwMDJjNGU2MzA2YzI1OWU1ZDY5N2NjZmM1YTA5NDg1MzUwNmU1YTBhNjQyNWYwYzA3OGNmODFjMmE2NSIsInZlcnNpb24iOjF9.Rc9u89zCdbFnjsnmq65l_JvCtUwOX_ZWapKJpTZ-rC8HxcUVfi2Ash2QfvvvxHH_YWhwklxxdnNa0HCm46qLAA
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
60
  ---
61
 
62
  # long-t5-tglobal-xl + BookSum
 
57
  name: gen_len
58
  verified: true
59
  verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMWZhOGMwMDJjNGU2MzA2YzI1OWU1ZDY5N2NjZmM1YTA5NDg1MzUwNmU1YTBhNjQyNWYwYzA3OGNmODFjMmE2NSIsInZlcnNpb24iOjF9.Rc9u89zCdbFnjsnmq65l_JvCtUwOX_ZWapKJpTZ-rC8HxcUVfi2Ash2QfvvvxHH_YWhwklxxdnNa0HCm46qLAA
60
+ - task:
61
+ type: summarization
62
+ name: Summarization
63
+ dataset:
64
+ name: billsum
65
+ type: billsum
66
+ config: default
67
+ split: test
68
+ metrics:
69
+ - name: ROUGE-1
70
+ type: rouge
71
+ value: 41.3645
72
+ verified: true
73
+ - name: ROUGE-2
74
+ type: rouge
75
+ value: 16.144
76
+ verified: true
77
+ - name: ROUGE-L
78
+ type: rouge
79
+ value: 24.2981
80
+ verified: true
81
+ - name: ROUGE-LSUM
82
+ type: rouge
83
+ value: 35.3234
84
+ verified: true
85
+ - name: loss
86
+ type: loss
87
+ value: 1.282260775566101
88
+ verified: true
89
+ - name: gen_len
90
+ type: gen_len
91
+ value: 291.8158
92
+ verified: true
93
  ---
94
 
95
  # long-t5-tglobal-xl + BookSum