Add verifyToken field to verify that evaluation results are produced by Hugging Face's automatic model evaluator

#5
by autoevaluator HF staff - opened
Files changed (1) hide show
  1. README.md +14 -10
README.md CHANGED
@@ -1,11 +1,11 @@
1
  ---
2
  language: en
3
- datasets:
4
- - squad_v2
5
  license: cc-by-4.0
6
  tags:
7
  - deberta
8
  - deberta-v3
 
 
9
  model-index:
10
  - name: deepset/deberta-v3-base-squad2
11
  results:
@@ -18,14 +18,16 @@ model-index:
18
  config: squad_v2
19
  split: validation
20
  metrics:
21
- - name: Exact Match
22
- type: exact_match
23
  value: 83.8248
 
24
  verified: true
25
- - name: F1
26
- type: f1
27
  value: 87.41
 
28
  verified: true
 
29
  - task:
30
  type: question-answering
31
  name: Question Answering
@@ -35,14 +37,16 @@ model-index:
35
  config: plain_text
36
  split: validation
37
  metrics:
38
- - name: Exact Match
39
- type: exact_match
40
  value: 84.9678
 
41
  verified: true
42
- - name: F1
43
- type: f1
44
  value: 92.2777
 
45
  verified: true
 
46
  ---
47
 
48
  # deberta-v3-base for QA
 
1
  ---
2
  language: en
 
 
3
  license: cc-by-4.0
4
  tags:
5
  - deberta
6
  - deberta-v3
7
+ datasets:
8
+ - squad_v2
9
  model-index:
10
  - name: deepset/deberta-v3-base-squad2
11
  results:
 
18
  config: squad_v2
19
  split: validation
20
  metrics:
21
+ - type: exact_match
 
22
  value: 83.8248
23
+ name: Exact Match
24
  verified: true
25
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2IyZTEyYzNlOTAwZmFlNWRiZTdiNzQzMTUyM2FmZTQ3ZWQwNWZmMzc2ZDVhYWYyMzkxOTUyMGNlMWY0M2E5MiIsInZlcnNpb24iOjF9.y8KvfefMLI977BYun0X1rAq5qudmezW_UJe9mh6sYBoiWaBosDO5TRnEGR1BHzdxmv2EgPK_PSomtZvb043jBQ
26
+ - type: f1
27
  value: 87.41
28
+ name: F1
29
  verified: true
30
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOWVhNjAwM2Q5N2Y3MGU4ZWY3N2Y0MmNjYWYwYmQzNTdiYWExODhkYmQ1YjIwM2I1ODEzNWIxZDI1ZWQ1YWRjNSIsInZlcnNpb24iOjF9.Jk0v1ZheLRFz6k9iNAgCMMZtPYj5eVwUCku4E76wRYc-jHPmiUuxvNiNkn6NW-jkBD8bJGMqDSjJyVpVMn9pBA
31
  - task:
32
  type: question-answering
33
  name: Question Answering
 
37
  config: plain_text
38
  split: validation
39
  metrics:
40
+ - type: exact_match
 
41
  value: 84.9678
42
+ name: Exact Match
43
  verified: true
44
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOWUxYTg4MzU3YTdmMDRmMGM0NjFjMTcwNGM3YzljM2RkMTc1ZGNhMDQwMTgwNGI0ZDE4ZGMxZTE3YjY5YzQ0ZiIsInZlcnNpb24iOjF9.KKaJ1UtikNe2g6T8XhLoWNtL9X4dHHyl_O4VZ5LreBT9nXneGc21lI1AW3n8KXTFGemzRpRMvmCDyKVDHucdDQ
45
+ - type: f1
46
  value: 92.2777
47
+ name: F1
48
  verified: true
49
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDU0ZTQwMzg4ZDY1ZWYxOGIxMzY2ODljZTBkMTNlYjA0ODBjNjcxNTg3ZDliYWU1YTdkYTM2NTIxOTg1MGM4OCIsInZlcnNpb24iOjF9.8VHg1BXx6gLw_K7MUK2QSE80Y9guiVR8n8K8nX4laGsLibxv5u_yDv9F3ahbUa1eZG_bbidl93TY2qFUiYHtAQ
50
  ---
51
 
52
  # deberta-v3-base for QA