autoevaluator HF staff committed on
Commit
755fb5c
1 Parent(s): 6393711

Add verifyToken field to verify evaluation results are produced by Hugging Face's automatic model evaluator

Browse files

Beep boop, I am a bot from Hugging Face's automatic model evaluator 👋! We've added a new `verifyToken` field to your evaluation results to verify that they are produced by the model evaluator. Accept this PR to ensure that your results remain listed as **verified** on the [Hub leaderboard](https://huggingface.co/spaces/autoevaluate/leaderboards).

Files changed (1) hide show
  1. README.md +134 -90
README.md CHANGED
@@ -5,12 +5,12 @@ license: mit
5
  tags:
6
  - text-classification
7
  - zero-shot-classification
8
- metrics:
9
- - accuracy
10
  datasets:
11
  - multi_nli
12
  - anli
13
  - fever
 
 
14
  pipeline_tag: zero-shot-classification
15
  model-index:
16
  - name: MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli
@@ -24,50 +24,61 @@ model-index:
24
  config: plain_text
25
  split: test_r3
26
  metrics:
27
- - name: Accuracy
28
- type: accuracy
29
  value: 0.495
 
30
  verified: true
31
- - name: Precision Macro
32
- type: precision
33
  value: 0.4984740618243923
 
34
  verified: true
35
- - name: Precision Micro
36
- type: precision
37
  value: 0.495
 
38
  verified: true
39
- - name: Precision Weighted
40
- type: precision
41
  value: 0.4984357572868885
 
42
  verified: true
43
- - name: Recall Macro
44
- type: recall
45
  value: 0.49461028192371476
 
46
  verified: true
47
- - name: Recall Micro
48
- type: recall
49
  value: 0.495
 
50
  verified: true
51
- - name: Recall Weighted
52
- type: recall
53
  value: 0.495
 
54
  verified: true
55
- - name: F1 Macro
56
- type: f1
57
  value: 0.4942810999491704
 
58
  verified: true
59
- - name: F1 Micro
60
- type: f1
61
  value: 0.495
 
62
  verified: true
63
- - name: F1 Weighted
64
- type: f1
65
  value: 0.4944671868893595
 
66
  verified: true
67
- - name: loss
68
- type: loss
69
  value: 1.8788293600082397
 
70
  verified: true
 
71
  - task:
72
  type: natural-language-inference
73
  name: Natural Language Inference
@@ -77,50 +88,61 @@ model-index:
77
  config: plain_text
78
  split: test_r1
79
  metrics:
80
- - name: Accuracy
81
- type: accuracy
82
  value: 0.712
 
83
  verified: true
84
- - name: Precision Macro
85
- type: precision
86
  value: 0.7134839439315348
 
87
  verified: true
88
- - name: Precision Micro
89
- type: precision
90
  value: 0.712
 
91
  verified: true
92
- - name: Precision Weighted
93
- type: precision
94
  value: 0.7134676028447461
 
95
  verified: true
96
- - name: Recall Macro
97
- type: recall
98
  value: 0.7119814425203647
 
99
  verified: true
100
- - name: Recall Micro
101
- type: recall
102
  value: 0.712
 
103
  verified: true
104
- - name: Recall Weighted
105
- type: recall
106
  value: 0.712
 
107
  verified: true
108
- - name: F1 Macro
109
- type: f1
110
  value: 0.7119226991285647
 
111
  verified: true
112
- - name: F1 Micro
113
- type: f1
114
  value: 0.712
 
115
  verified: true
116
- - name: F1 Weighted
117
- type: f1
118
  value: 0.7119242267218338
 
119
  verified: true
120
- - name: loss
121
- type: loss
122
  value: 1.0105403661727905
 
123
  verified: true
 
124
  - task:
125
  type: natural-language-inference
126
  name: Natural Language Inference
@@ -130,50 +152,61 @@ model-index:
130
  config: default
131
  split: validation_mismatched
132
  metrics:
133
- - name: Accuracy
134
- type: accuracy
135
  value: 0.902766476810415
 
136
  verified: true
137
- - name: Precision Macro
138
- type: precision
139
  value: 0.9023816542652491
 
140
  verified: true
141
- - name: Precision Micro
142
- type: precision
143
  value: 0.902766476810415
 
144
  verified: true
145
- - name: Precision Weighted
146
- type: precision
147
  value: 0.9034597464719761
 
148
  verified: true
149
- - name: Recall Macro
150
- type: recall
151
  value: 0.9024304801555488
 
152
  verified: true
153
- - name: Recall Micro
154
- type: recall
155
  value: 0.902766476810415
 
156
  verified: true
157
- - name: Recall Weighted
158
- type: recall
159
  value: 0.902766476810415
 
160
  verified: true
161
- - name: F1 Macro
162
- type: f1
163
  value: 0.9023086094638595
 
164
  verified: true
165
- - name: F1 Micro
166
- type: f1
167
  value: 0.902766476810415
 
168
  verified: true
169
- - name: F1 Weighted
170
- type: f1
171
  value: 0.9030161011457231
 
172
  verified: true
173
- - name: loss
174
- type: loss
175
  value: 0.3283354640007019
 
176
  verified: true
 
177
  - task:
178
  type: natural-language-inference
179
  name: Natural Language Inference
@@ -183,50 +216,61 @@ model-index:
183
  config: plain_text
184
  split: dev_r1
185
  metrics:
186
- - name: Accuracy
187
- type: accuracy
188
  value: 0.737
 
189
  verified: true
190
- - name: Precision Macro
191
- type: precision
192
  value: 0.737681071614645
 
193
  verified: true
194
- - name: Precision Micro
195
- type: precision
196
  value: 0.737
 
197
  verified: true
198
- - name: Precision Weighted
199
- type: precision
200
  value: 0.7376755842752241
 
201
  verified: true
202
- - name: Recall Macro
203
- type: recall
204
  value: 0.7369675064285843
 
205
  verified: true
206
- - name: Recall Micro
207
- type: recall
208
  value: 0.737
 
209
  verified: true
210
- - name: Recall Weighted
211
- type: recall
212
  value: 0.737
 
213
  verified: true
214
- - name: F1 Macro
215
- type: f1
216
  value: 0.7366853496239583
 
217
  verified: true
218
- - name: F1 Micro
219
- type: f1
220
  value: 0.737
 
221
  verified: true
222
- - name: F1 Weighted
223
- type: f1
224
  value: 0.7366990292378379
 
225
  verified: true
226
- - name: loss
227
- type: loss
228
  value: 0.9349392056465149
 
229
  verified: true
 
230
  ---
231
  # DeBERTa-v3-base-mnli-fever-anli
232
  ## Model description
 
5
  tags:
6
  - text-classification
7
  - zero-shot-classification
 
 
8
  datasets:
9
  - multi_nli
10
  - anli
11
  - fever
12
+ metrics:
13
+ - accuracy
14
  pipeline_tag: zero-shot-classification
15
  model-index:
16
  - name: MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli
 
24
  config: plain_text
25
  split: test_r3
26
  metrics:
27
+ - type: accuracy
 
28
  value: 0.495
29
+ name: Accuracy
30
  verified: true
31
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYWViYjQ5YTZlYjU4NjQyN2NhOTVhNjFjNGQyMmFiNmQyZjRkOTdhNzJmNjc3NGU4MmY0MjYyMzY5MjZhYzE0YiIsInZlcnNpb24iOjF9.S8pIQ7gEGokd_wKXMi6Bc3B2DThIP3cvVkTFErZ-2JxXTSCy1TBuulY3dzGfaiP7kTHbL52OuBhG_-wb7Ue9DQ
32
+ - type: precision
33
  value: 0.4984740618243923
34
+ name: Precision Macro
35
  verified: true
36
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOTllZDU3NmVmYjk4ZmYzNjAwNzExMGZjNDMzOWRkZjRjMTRhNzhlZmI0ZmNlM2E0Mzk4OWE5NTM5MTYyYWU5NCIsInZlcnNpb24iOjF9.WHz_TUJgPVn-rU-9vBCDdmSMOuWzADwr09rJY6ktqRM46zytbyWs7Vcm7jqDrTkfU-rp0_7IyoNv_xEsKhJbBA
37
+ - type: precision
38
  value: 0.495
39
+ name: Precision Micro
40
  verified: true
41
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjllODE3ZjUxZDhiMTI0MzZmYjY5OTUwYWI2OTc4ZjJhNTVjMjY2ODdkMmJlZjQ5YWQ1Mjk2ZThmYjJlM2RlYSIsInZlcnNpb24iOjF9.a9V06-O7l9S0Bv4vj0aard8128SAP61DZdXl_3XqdmNgt_C6KAoDBVueF2M2kF_kT6lRfEz6YW0ACIfJNXDYAA
42
+ - type: precision
43
  value: 0.4984357572868885
44
+ name: Precision Weighted
45
  verified: true
46
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjhiMzYzY2JiMmYwN2YxYzEwZTQ3NGI1NzFmMzliNjJkMDE2YzI5Njg1ZjEzMGIxODdiMDNmYmI4Y2Y2MmJkMiIsInZlcnNpb24iOjF9.xvZZaUMogw9MJjb3ls6h5liDlTqHMmNgqk6KbyDqQWfCcD255brCU3Xo6nECwaChS4te0dQu_iWGBqR_o2kYAA
47
+ - type: recall
48
  value: 0.49461028192371476
49
+ name: Recall Macro
50
  verified: true
51
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDVjYTEzOTI0ZjVhOTk3ZTkzZmZhNTk5ODcxMWJhYWU4ZTRjYWVhNzcwOWY5YmI2NGFlYWE4NjM5MDY5NTExOSIsInZlcnNpb24iOjF9.xgHCB2rbCQBzHzUokw4u8JyOdhtF4yvPv1t8t7YiEkaAuM5MAPsVuCZ1VtlLapHS_IWetlocizsVl6akjh3cAQ
52
+ - type: recall
53
  value: 0.495
54
+ name: Recall Micro
55
  verified: true
56
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYTEyYmM0ZDQ0M2RiMDNhNjIxNzQ4OWZiNTBiOTAwZDFkNjNmYjBhNjA4NmQ0NjFkNmNiZTljNDkxNDg3NzIyYSIsInZlcnNpb24iOjF9.3FJPwNtwgFNvMjVxVAayaVXXR1sWlr0sqAYmXzmMzMxl7IJh6RS77dGPwFaqD3jamLVBiqPn9wsfz5lFK5yTAA
57
+ - type: recall
58
  value: 0.495
59
+ name: Recall Weighted
60
  verified: true
61
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmY1MjZlZTQ4OTg5YzdlYmFhZDMzMmNlNjNkYmIyZGI4M2NjZjQ1ZDVkNmZkMTUxNjI3M2UwZmI1MDM1NDYwOSIsInZlcnNpb24iOjF9.cnbM6xjTLRa9z0wEDGd_Q4lTXVLRKIQ6_YLGLjf-t7Nto4lzxAeWF-RrwA0Mq9OPITlJq2Jk1Eg_0Utb13d9Dg
62
+ - type: f1
63
  value: 0.4942810999491704
64
+ name: F1 Macro
65
  verified: true
66
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2U3NGM1MDM4YTM4NzQxMGM4ZTIyZDM2YTQ1MGNlZWM1MzEzM2MxN2ZmZmRmYTM0OWJmZGJjYjM5OWEzMmZjNSIsInZlcnNpb24iOjF9.vMtge1F-tmMn9D3aVUuwcNEXjqpNgEyHAl9f5UDSoTYcOgTwi2vi5yRGRCl8y6Fx7BtgaCwMyoZVNbP5-GRtCA
67
+ - type: f1
68
  value: 0.495
69
+ name: F1 Micro
70
  verified: true
71
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjBjMTQ5MmQ5OGE5OWJjZGMyNzg4N2RmNDUzMzQ5Zjc4ZTc4N2JlMTk0MTc2M2RjZTgzOTNlYWQzODAwNDI0NCIsInZlcnNpb24iOjF9.yxXG0CNWW8__xJC14BjbTY9QkXD75x6uCIXR51oKDemkP0b_xGyd-A2wPIuwNJN1EYkQevPY0bhVpRWBKyO9Bg
72
+ - type: f1
73
  value: 0.4944671868893595
74
+ name: F1 Weighted
75
  verified: true
76
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzczNjQzY2FmMmY4NTAwYjNkYjJlN2I2NjI2Yjc0ZmQ3NjZiN2U5YWEwYjk4OTUyOTMzZTYyZjYzOTMzZGU2YiIsInZlcnNpb24iOjF9.mLOnst2ScPX7ZQwaUF12W2nv7-w9lX9-BxHl3-0T0gkSWnmtBSwYcL5faTX0_I5q33Fjz5tfkjpCJuxP5JYIBQ
77
+ - type: loss
78
  value: 1.8788293600082397
79
+ name: loss
80
  verified: true
81
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzRlOTYwYjU1Y2Y4ZGM0NDBjYTE2MmEzNWIwN2NiMWVkOWZlNzA2ZmQ3YjZjNzI4MjQwYWZhODIwMzU3ODAyZiIsInZlcnNpb24iOjF9._Xs9bl48MSavvp5eyamrP2iNlFWv35QZCrmWjJXLkUdIBx0ElCjEdxBb3dxPGnUxdpDzGMmOoKCPI44ZPXrtDw
82
  - task:
83
  type: natural-language-inference
84
  name: Natural Language Inference
 
88
  config: plain_text
89
  split: test_r1
90
  metrics:
91
+ - type: accuracy
 
92
  value: 0.712
93
+ name: Accuracy
94
  verified: true
95
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYWYxMGY0ZWU0YTEyY2I3NmQwZmQ3YmFmNzQxNGU5OGNjN2ViN2I0ZjdkYWUzM2RmYzkzMDg3ZjVmNGYwNGZkZCIsInZlcnNpb24iOjF9.snWBusAeo1rrQqWk--vTxb-CBcFqM298YCtwTQGBZiFegKGSTSKzj-SM6HMNsmoQWmMuv7UfYPqYlnzEthOSAg
96
+ - type: precision
97
  value: 0.7134839439315348
98
+ name: Precision Macro
99
  verified: true
100
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjMxMjg1Y2QwNzMwM2ZkNGM3ZTJhOGJmY2FkNGI1ZTFhOGQ3ODViNTJmZTYwMWJkZDYyYWRjMzFmZDI1NTM5YSIsInZlcnNpb24iOjF9.ZJnY6zYOBn-YEtN7uKzQ-VKXPwlIO1zq19Yuo37vBJNSs1dGDd8f1jgfdZuA19e_wA3Nc5nQKe9VXRwPHPgwAQ
101
+ - type: precision
102
  value: 0.712
103
+ name: Precision Micro
104
  verified: true
105
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZWM4YWQyODBlYTIwMWQxZDA1NmY1M2M2ODgwNDJiY2RhMDVhYTlkMDUzZTJkMThkYzRmNDg2YTdjMjczNGUwOCIsInZlcnNpb24iOjF9.SogsKHdbdlEs05IBYwXvlnaC_esg-DXAPc2KPRyHaVC5ItVHbxa63NpybSpao4baOoMlLG9aRe7TjG4gtB2dAQ
106
+ - type: precision
107
  value: 0.7134676028447461
108
+ name: Precision Weighted
109
  verified: true
110
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODdjMzFkM2IwNWZiM2I4ZWViMmQ4NWM5MDY5ZWQxZjc1MGRmNjhmNzJhYWFmOWEwMjg3ZjhiZWM3YjlhOTIxNSIsInZlcnNpb24iOjF9._0JNIbiqLuDZrp_vrCljBe28xexZJPmigLyhkcO8AtH2VcNxWshwCpZuRF4bqvpMvnApJeuGMf3vXjCj0MC1Bw
111
+ - type: recall
112
  value: 0.7119814425203647
113
+ name: Recall Macro
114
  verified: true
115
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYjU4MWEyMzkyYzg1ZTIxMTc0M2NhMTgzOGEyZmY5OTg3M2Q1ZmMwNmU3ZmU1ZjA1MDk0OGZkMzM5NDVlZjBlNSIsInZlcnNpb24iOjF9.sZ3GTcmGGthpTLL7_Zovq8aBmE3Dp_PZi5v8ZI9yG9N6B_GjWvBuPC8ENXK1NwmwiHLsSvtKTG5JmAum-su0Dg
116
+ - type: recall
117
  value: 0.712
118
+ name: Recall Micro
119
  verified: true
120
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDg3NGViZTlmMWM2ZDNhMzIzZGZkYWZhODQxNzg2MjNiNjQ0Zjg0NjQ1OWZkY2I5ODdiY2Y3Y2JjNzRmYjJkMiIsInZlcnNpb24iOjF9.bCZUzJamsozKWehnNph6E5coww5zZTrJdbWevWrSyfT0PyXc_wkZ-NKdyBAoqprBz3_8L3i5hPM6Qsy56b4BDA
121
+ - type: recall
122
  value: 0.712
123
+ name: Recall Weighted
124
  verified: true
125
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDk1MDJiOGUzZThlZjJjMzY4NjMzODFiZjUzZmIwMjIxY2UwNzBiN2IxMWEwMGJjZTkxODA0YzUxZDE3ODRhOCIsInZlcnNpb24iOjF9.z0dqvB3aBVYt3xRIb_M4svWebfQc0QaDFVFzHnlA5QGEHkHOW3OecGhHE4EzBqTDI3DASWZTGMjrMDDt0uOMBw
126
+ - type: f1
127
  value: 0.7119226991285647
128
+ name: F1 Macro
129
  verified: true
130
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiM2U0YjMwNzhmOTEyNDZhODU3MTU0YTM4MmQ0NzEzNWI1YjY0ZWQ3MWRiMTdiNTUzNWRkZThjMWE4M2NkZmI0MiIsInZlcnNpb24iOjF9.hhj1BXkuWi9wXrCjT9NwqaPETtOoYNiyqYsJEw-ufA8A4hVThKA6ZBtma1Q_M65-DZFfPEBDBNASLZ7EPSbmDw
131
+ - type: f1
132
  value: 0.712
133
+ name: F1 Micro
134
  verified: true
135
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODk0Y2EyMzc5M2ZlNWFlNDg2Zjc1OTQxNGY3YjA5YjUxYTYzZjRlZmU4ODYxNjA3ZjkxNGUzYjBmNmMxMzY5YiIsInZlcnNpb24iOjF9.DvKk-3hNh2LhN2ug5e0FgUntL3Ozdfl06Kz7jvmB-deOJH6INi2a2ZySXoEePoo8t2nR6ENFYu9QjMA2ojnpCA
136
+ - type: f1
137
  value: 0.7119242267218338
138
+ name: F1 Weighted
139
  verified: true
140
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2MxOWFlMmI2NGRiMjkwN2Q5MWZhNDFlYzQxNWNmNzQ3OWYxZThmNDU2OWU1MTE5OGY2MWRlYWUyNDM3OTkzZCIsInZlcnNpb24iOjF9.QrTD1gE8_wRok9u59W-Mx0cX89K-h2Ad6qa8J5rmP8lc_rkG0ft2n5_GqH1CBZBJwMFYv91Pn6TuE3eGxJuUDA
141
+ - type: loss
142
  value: 1.0105403661727905
143
+ name: loss
144
  verified: true
145
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMmUwMTg4NjM3ZTBiZTIyODcyNDNmNTE5ZDZhMzNkMDMyNjcwOGQ5NmY0NTlhMjgyNmIzZjRiNDFiNjA3M2RkZSIsInZlcnNpb24iOjF9.sjBDVJV-jnygwcppmByAXpoo-Wzz178bBzozJEuYEiJaHSbk_xEevfJS1PmLUuplYslKb1iyEctnjI-5bl-XDw
146
  - task:
147
  type: natural-language-inference
148
  name: Natural Language Inference
 
152
  config: default
153
  split: validation_mismatched
154
  metrics:
155
+ - type: accuracy
 
156
  value: 0.902766476810415
157
+ name: Accuracy
158
  verified: true
159
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjExZWM3YzA3ZDNlNjEwMmViNWEwZTE3MjJjNjEyNDhjOTQxNGFmMzBjZTk0ODUwYTc2OGNiZjYyMTBmNWZjZSIsInZlcnNpb24iOjF9.zbFAGrv2flpmweqS7Poxib7qHFLdW8eUTzshdOm2B9H-KWpIZCWC-P4p8TLMdNJnUcZJZ03Okil4qjIMqqIRCA
160
+ - type: precision
161
  value: 0.9023816542652491
162
+ name: Precision Macro
163
  verified: true
164
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2U2MGViNmJjNWQxNzRjOTkxNDIxZjZjNmM5YzE4ZjU5NTE5NjFlNmEzZWRlOGYxN2E3NTAwMTEwYjNhNzE0YSIsInZlcnNpb24iOjF9.WJjDJf56FROvf7Y5ShWnnxMvK_ZpQ2PibAOtSFhSiYJ7bt4TGOzMwaZ5RSTf_mcfXgRfWbXmy1jCwNhDb-5EAw
165
+ - type: precision
166
  value: 0.902766476810415
167
+ name: Precision Micro
168
  verified: true
169
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzRhZTExOTc5NDczZjI1YmMzOGYyOTU2MDU1OGE5ZTczMDE0MmU0NzZhY2YzMDI1ZGQ3MGM5MmJiODFkNzUzZiIsInZlcnNpb24iOjF9.aRYcGEI1Y8-a0d8XOoXhBgsFyj9LWNwEjoIPc594y7kJn91wXIsXoR0-_0iy3uz41mWaTTlwJx7lI-kipFDvDQ
170
+ - type: precision
171
  value: 0.9034597464719761
172
+ name: Precision Weighted
173
  verified: true
174
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMWQyMTZiZDA2OTUwZjRmNTFiMWRlZTNmOTliZmI2MWFmMjdjYzEyYTgwNzkyOTQzOTBmNTUyYjMwNTUxMTFkNiIsInZlcnNpb24iOjF9.hUtAMTl0THHUkaLcgk1Vy9IhjqJAXCJ_5STJ5A7k7s_SO9DHp3b6qusgwPmcGLYyPy1-j1dB2AIstxK4tHfmDA
175
+ - type: recall
176
  value: 0.9024304801555488
177
+ name: Recall Macro
178
  verified: true
179
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzAxZGJhNGI3ZDNlMjg2ZDIxNTgwMDY5MTFjM2ExZmIxMDBmZjUyNTliNWNkOGI0OTY3NTYyNWU3OWFlYTA3YiIsInZlcnNpb24iOjF9.1o_GNq8zmXa_50MUF_K63IDc2aUKNeUkNQ5fT592-SAo8WgiaP9Dh6bOEu2OqrpRQ57P4qm7OdJt7UKsrosMDA
180
+ - type: recall
181
  value: 0.902766476810415
182
+ name: Recall Micro
183
  verified: true
184
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjhiMWE4Yjk0ODFkZjlkYjRlMjU1OTJmMjA2Njg1N2M4MzQ0OWE3N2FlYjY4NDgxZThjMmExYWQ5OGNmYmI1NSIsInZlcnNpb24iOjF9.Gmm5lf_qpxjXWWrycDze7LHR-6WGQc62WZTmcoc5uxWd0tivEUqCAFzFdbEU1jVKxQBIyDX77CPuBm7mUA4sCg
185
+ - type: recall
186
  value: 0.902766476810415
187
+ name: Recall Weighted
188
  verified: true
189
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2EzZWYwNjNkYWE1YTcyZGZjNTNhMmNlNzgzYjk5MGJjOWJmZmE5NmYwM2U2NTA5ZDY3ZjFiMmRmZmQwY2QwYiIsInZlcnNpb24iOjF9.yA68rslg3e9kUR3rFTNJJTAad6Usr4uFmJvE_a7G2IvSKqLxG_pqsHszsWfg5mFBQLjWEAyCtdQYMdVayuYMBA
190
+ - type: f1
191
  value: 0.9023086094638595
192
+ name: F1 Macro
193
  verified: true
194
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzMyMzZhNjI5MWRmZWJhMjkzN2E0MjM4ZTM5YzZmNTk5YTZmYzU4NDRiYjczZGQ4MDdhNjJiMGU0MjE3NDEwNyIsInZlcnNpb24iOjF9.RCMqH_xUMN97Vos54pTFfAMbLstXUMdFTs-eNaypbDb_Fc-MW8NLmJ6dzJsp9sSvhXyYjugjRMUpMpnQseKXDA
195
+ - type: f1
196
  value: 0.902766476810415
197
+ name: F1 Micro
198
  verified: true
199
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTYxZTZhZGM0NThlNTAzNmYwMTA4NDNkN2FiNzhhN2RlYThlYjcxMjE5MjBkMzhiOGYxZGRmMjE0NGM2ZWQ5ZSIsInZlcnNpb24iOjF9.wRfllNw2Gibmi1keU7d_GjkyO0F9HESCgJlJ9PHGZQRRT414nnB-DyRvulHjCNnaNjXqMi0LJimC3iBrNawwAw
200
+ - type: f1
201
  value: 0.9030161011457231
202
+ name: F1 Weighted
203
  verified: true
204
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDA0YjAxMWU5MjI4MWEzNTNjMzJlNjM3ZDMxOTE0ZTZhYmZlNmUyNDViNTU2NmMyMmM3MjAxZWVjNWJmZjI4MCIsInZlcnNpb24iOjF9.vJ8aUjfTbFMc1BgNUVpoVDuYwQJYQjwZQxblkUdvSoGtkW_AzQJ_KJ8Njc7IBA3ADgj8iZHjRQNIZkFCf-xICw
205
+ - type: loss
206
  value: 0.3283354640007019
207
+ name: loss
208
  verified: true
209
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODdmYzYzNTUzZDNmOWIxM2E0ZmUyOWUzM2Y2NGRmZDNiYjg3ZTMzYTUyNzg3OWEzNzYyN2IyNmExOGRlMWUxYSIsInZlcnNpb24iOjF9.Qv0FzFZPkcBs9aHGf4TEREX4jdkc40NazdMlP2M_-w2wHwyjoAjvhk611RLXHcbicozNelZJLnsOMdEMnPLEDg
210
  - task:
211
  type: natural-language-inference
212
  name: Natural Language Inference
 
216
  config: plain_text
217
  split: dev_r1
218
  metrics:
219
+ - type: accuracy
 
220
  value: 0.737
221
+ name: Accuracy
222
  verified: true
223
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMTQ1ZGVkOTVmNTlhYjhkMjVlNTNhMjNmZWFjZWZjZjcxZmRhMDVlOWI0YTdkOTMwYjVjNWFlOGY4OTc1MmRhNiIsInZlcnNpb24iOjF9.wGLgKA1E46ljbLokdPeip_UCr1gqK8iSSbsJKX2vgKuuhDdUWWiECrUFN-bv_78JWKoKW5T0GF_hb-RVDzA0AQ
224
+ - type: precision
225
  value: 0.737681071614645
226
+ name: Precision Macro
227
  verified: true
228
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYmFkMGUwMjNhN2E3NzMxNTc5NDM0MjY1MGU5ODllM2Q2YzA1MDI3OGI1ZmI4YTcxN2E4ZDk5OWY2OGNiN2I0MCIsInZlcnNpb24iOjF9.6G5qhccjheaNfasgRyrkKBTaQPRzuPMZZ0hrLxTNzAydMDgx09FkFP3hni7WLRMWp0IpwzkEeBlxV-mPyQBtBw
229
+ - type: precision
230
  value: 0.737
231
+ name: Precision Micro
232
  verified: true
233
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2QzYjQ4ZDZjOGU5YzI3YmFlMThlYTRkYTUyYWIyNzc4NDkwNzM1OWFiMTgyMzA0NDZmMGI3YTQxODBjM2EwMCIsInZlcnNpb24iOjF9.bvNWyzfct1CLJFx_EuD2GeKieVtyGJy0cwUBP2qJE1ey2i9SVn6n1Dr0AALTGBkxQ6n5-fJ61QFNufpdr2KvCA
234
+ - type: precision
235
  value: 0.7376755842752241
236
+ name: Precision Weighted
237
  verified: true
238
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2VmYWYzZWQwZmMzMDk0NTdlY2Y3NDkzYWY5ZTdmOGU0ZTUzZWE4YWFhZjVmODhkZmE1Njg4NjA5YjJmYWVhOSIsInZlcnNpb24iOjF9.50FQR2aoBpORLgYa7482ZTrRhT-KfIgv5ltBEHndUBMmqGF9Ru0LHENSGwyD_tO89sGPfiW32TxpbrNWiBdIBA
239
+ - type: recall
240
  value: 0.7369675064285843
241
+ name: Recall Macro
242
  verified: true
243
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTM4OTAyNDYwNjY4Zjc5NDljNjBmNTg2Mzk4YjYxM2MyYTA0MDllYTMyNzEwOGI1ZTEwYWE3ZmU0NDZmZDg2NiIsInZlcnNpb24iOjF9.UvWBxuApNV3vd4hpgwqd6XPHCbkA_bB_Cw24ooquiOf0dstvjP3JvpGoDp5SniOzIOg3i2aYbcvFCLJqEXMZCQ
244
+ - type: recall
245
  value: 0.737
246
+ name: Recall Micro
247
  verified: true
248
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYmQ4MjMzNzRmNTI5NjIzNGQ0ZDFmZTA1MDU3OTk0MzYyMGI0NTMzZTZlMTQ1MDc1MzBkMGMzYjcxZjU1NDNjOSIsInZlcnNpb24iOjF9.kpbdXOpDG3CUB-kUEXsgFT3HWWIbu70wwzs2TNf0rhIuRrzdZz3dXXvwqu1BcLJTsOxl8G6NTiYXgnv-ul8lDg
249
+ - type: recall
250
  value: 0.737
251
+ name: Recall Weighted
252
  verified: true
253
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmU1ZWJkNWE0NjczY2NiZWYyNzYyMzllNzZmZTIxNWRkYTEyZDgxN2E0NTNmM2ExMTc1ZWVjMzBiYjg0ZmM1MiIsInZlcnNpb24iOjF9.S6HHWCWnut_LJqXbEA_Z8ZOTtyq6V51ZeiA0qbwzr0hapDYZOZHrN4prvSLvoNv-GiYDYKatwIsAZxCZc5fmCA
254
+ - type: f1
255
  value: 0.7366853496239583
256
+ name: F1 Macro
257
  verified: true
258
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNzkxYmY2NTcyOTE0ZDdjNGY2ZmE4MzQwMGIxZTA2MDg1NzI5YTQ0MTdkZjdkNzNkMDM2NTk2MTNiNjU4ODMwZCIsInZlcnNpb24iOjF9.ECVaCBqGd0pnQT3xJF7yWrgecIb-5TMiVWpEO0MQGhYy43snkI6Qs-2FOXzvfwIWqG-Q6XIIhGbWZh5TFEGKCA
259
+ - type: f1
260
  value: 0.737
261
+ name: F1 Micro
262
  verified: true
263
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDMwMWZiNzQyNWEzNmMzMDJjOTAxYzAxNzc0MTNlYzRkZjllYmNjZmU0OTgzZDFkNWM1ZWI5OTA2NzE5Y2YxOSIsInZlcnNpb24iOjF9.8yZFol_Gcj9n3w9Yk5wx48yql7p3wriDecv-6VSTAB6Q_MWLQAWsCEGRRhgGJ3zvhoRehJZdb35ozk36VOinDQ
264
+ - type: f1
265
  value: 0.7366990292378379
266
+ name: F1 Weighted
267
  verified: true
268
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjhhN2ZkMjc5ZGQ3ZGM1Nzk3ZTgwY2E1N2NjYjdhNjZlOTdhYmRlNGVjN2EwNTIzN2UyYTY2ODVlODhmY2Q4ZCIsInZlcnNpb24iOjF9.Cz7ClDAfCGpqdRTYd5v3dPjXFq8lZLXx8AX_rqmF-Jb8KocqVDsHWeZScW5I2oy951UrdMpiUOLieBuJLOmCCQ
269
+ - type: loss
270
  value: 0.9349392056465149
271
+ name: loss
272
  verified: true
273
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmI4MTI5MDM1NjBmMzgzMzc2NjM5MzZhOGUyNTgyY2RlZTEyYTIzYzY2ZGJmODcxY2Q5OTVjOWU3OTQ2MzM1NSIsInZlcnNpb24iOjF9.bSOFnYC4Y2y2pW1AR-bgPUHKafR-0OHf8PvexK8eQLsS323Xy9-rYkKUaP09KY6_fk9GqAawv5eqj72B_uyeCA
274
  ---
275
  # DeBERTa-v3-base-mnli-fever-anli
276
  ## Model description