sjrhuschlee committed on
Commit
eb52a60
1 Parent(s): 26366e7

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +38 -38
README.md CHANGED
@@ -40,10 +40,10 @@ model-index:
40
  split: validation
41
  metrics:
42
  - type: exact_match
43
- value: 86.320
44
  name: Exact Match
45
  - type: f1
46
- value: 92.947
47
  name: F1
48
  - task:
49
  type: question-answering
@@ -54,12 +54,12 @@ model-index:
54
  config: adversarialQA
55
  split: validation
56
  metrics:
57
- - type: exact_match
58
- value: 23.133
59
- name: Exact Match
60
- - type: f1
61
- value: 31.386
62
- name: F1
63
  - task:
64
  type: question-answering
65
  name: Question Answering
@@ -70,71 +70,71 @@ model-index:
70
  split: validation
71
  metrics:
72
  - type: exact_match
73
- value: 68.159
74
  name: Exact Match
75
  - type: f1
76
- value: 71.876
77
  name: F1
78
  - task:
79
  type: question-answering
80
  name: Question Answering
81
  dataset:
82
- name: squadshifts
83
  type: squadshifts
84
  config: amazon
85
  split: test
86
  metrics:
87
- - type: exact_match
88
- value: 67.587
89
- name: Exact Match
90
- - type: f1
91
- value: 80.085
92
- name: F1
93
  - task:
94
  type: question-answering
95
  name: Question Answering
96
  dataset:
97
- name: squadshifts
98
  type: squadshifts
99
  config: new_wiki
100
  split: test
101
  metrics:
102
- - type: exact_match
103
- value: 77.261
104
- name: Exact Match
105
- - type: f1
106
- value: 85.068
107
- name: F1
108
  - task:
109
  type: question-answering
110
  name: Question Answering
111
  dataset:
112
- name: squadshifts
113
  type: squadshifts
114
  config: nyt
115
  split: test
116
  metrics:
117
- - type: exact_match
118
- value: 79.066
119
- name: Exact Match
120
- - type: f1
121
- value: 86.178
122
- name: F1
123
  - task:
124
  type: question-answering
125
  name: Question Answering
126
  dataset:
127
- name: squadshifts
128
  type: squadshifts
129
  config: reddit
130
  split: test
131
  metrics:
132
- - type: exact_match
133
- value: 65.052
134
- name: Exact Match
135
- - type: f1
136
- value: 74.785
137
- name: F1
138
  ---
139
 
140
  # flan-t5-base for Extractive QA
 
40
  split: validation
41
  metrics:
42
  - type: exact_match
43
+ value: 86.367
44
  name: Exact Match
45
  - type: f1
46
+ value: 92.965
47
  name: F1
48
  - task:
49
  type: question-answering
 
54
  config: adversarialQA
55
  split: validation
56
  metrics:
57
+ - type: exact_match
58
+ value: 34.167
59
+ name: Exact Match
60
+ - type: f1
61
+ value: 46.911
62
+ name: F1
63
  - task:
64
  type: question-answering
65
  name: Question Answering
 
70
  split: validation
71
  metrics:
72
  - type: exact_match
73
+ value: 80.862
74
  name: Exact Match
75
  - type: f1
76
+ value: 86.070
77
  name: F1
78
  - task:
79
  type: question-answering
80
  name: Question Answering
81
  dataset:
82
+ name: squadshifts amazon
83
  type: squadshifts
84
  config: amazon
85
  split: test
86
  metrics:
87
+ - type: exact_match
88
+ value: 71.624
89
+ name: Exact Match
90
+ - type: f1
91
+ value: 85.113
92
+ name: F1
93
  - task:
94
  type: question-answering
95
  name: Question Answering
96
  dataset:
97
+ name: squadshifts new_wiki
98
  type: squadshifts
99
  config: new_wiki
100
  split: test
101
  metrics:
102
+ - type: exact_match
103
+ value: 82.389
104
+ name: Exact Match
105
+ - type: f1
106
+ value: 91.259
107
+ name: F1
108
  - task:
109
  type: question-answering
110
  name: Question Answering
111
  dataset:
112
+ name: squadshifts nyt
113
  type: squadshifts
114
  config: nyt
115
  split: test
116
  metrics:
117
+ - type: exact_match
118
+ value: 83.736
119
+ name: Exact Match
120
+ - type: f1
121
+ value: 91.675
122
+ name: F1
123
  - task:
124
  type: question-answering
125
  name: Question Answering
126
  dataset:
127
+ name: squadshifts reddit
128
  type: squadshifts
129
  config: reddit
130
  split: test
131
  metrics:
132
+ - type: exact_match
133
+ value: 72.743
134
+ name: Exact Match
135
+ - type: f1
136
+ value: 84.273
137
+ name: F1
138
  ---
139
 
140
  # flan-t5-base for Extractive QA