zeroMN committed on
Commit
732b624
·
verified ·
1 Parent(s): 1754c5c

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +290 -2
README.md CHANGED
@@ -1,4 +1,294 @@
1
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  language:
3
  - en
4
  - zh
@@ -9,8 +299,6 @@ tags:
9
  - vqa
10
  - text
11
  - audio
12
- datasets:
13
- - synthetic-dataset
14
  metrics:
15
  - accuracy
16
  - bleu
 
1
  ---
2
+ datasets:
3
+ - nyu-mll/glue
4
+ - aps/super_glue
5
+ - facebook/anli
6
+ - tasksource/babi_nli
7
+ - sick
8
+ - snli
9
+ - scitail
10
+ - hans
11
+ - alisawuffles/WANLI
12
+ - tasksource/recast
13
+ - sileod/probability_words_nli
14
+ - joey234/nan-nli
15
+ - pietrolesci/nli_fever
16
+ - pietrolesci/breaking_nli
17
+ - pietrolesci/conj_nli
18
+ - pietrolesci/fracas
19
+ - pietrolesci/dialogue_nli
20
+ - pietrolesci/mpe
21
+ - pietrolesci/dnc
22
+ - pietrolesci/recast_white
23
+ - pietrolesci/joci
24
+ - pietrolesci/robust_nli
25
+ - pietrolesci/robust_nli_is_sd
26
+ - pietrolesci/robust_nli_li_ts
27
+ - pietrolesci/gen_debiased_nli
28
+ - pietrolesci/add_one_rte
29
+ - tasksource/imppres
30
+ - hlgd
31
+ - paws
32
+ - medical_questions_pairs
33
+ - Anthropic/model-written-evals
34
+ - truthful_qa
35
+ - nightingal3/fig-qa
36
+ - tasksource/bigbench
37
+ - blimp
38
+ - cos_e
39
+ - cosmos_qa
40
+ - dream
41
+ - openbookqa
42
+ - qasc
43
+ - quartz
44
+ - quail
45
+ - head_qa
46
+ - sciq
47
+ - social_i_qa
48
+ - wiki_hop
49
+ - wiqa
50
+ - piqa
51
+ - hellaswag
52
+ - pkavumba/balanced-copa
53
+ - 12ml/e-CARE
54
+ - art
55
+ - winogrande
56
+ - codah
57
+ - ai2_arc
58
+ - definite_pronoun_resolution
59
+ - swag
60
+ - math_qa
61
+ - metaeval/utilitarianism
62
+ - mteb/amazon_counterfactual
63
+ - SetFit/insincere-questions
64
+ - SetFit/toxic_conversations
65
+ - turingbench/TuringBench
66
+ - trec
67
+ - tals/vitaminc
68
+ - hope_edi
69
+ - strombergnlp/rumoureval_2019
70
+ - ethos
71
+ - tweet_eval
72
+ - discovery
73
+ - pragmeval
74
+ - silicone
75
+ - lex_glue
76
+ - papluca/language-identification
77
+ - imdb
78
+ - rotten_tomatoes
79
+ - ag_news
80
+ - yelp_review_full
81
+ - financial_phrasebank
82
+ - poem_sentiment
83
+ - dbpedia_14
84
+ - amazon_polarity
85
+ - app_reviews
86
+ - hate_speech18
87
+ - sms_spam
88
+ - humicroedit
89
+ - snips_built_in_intents
90
+ - hate_speech_offensive
91
+ - yahoo_answers_topics
92
+ - pacovaldez/stackoverflow-questions
93
+ - zapsdcn/hyperpartisan_news
94
+ - zapsdcn/sciie
95
+ - zapsdcn/citation_intent
96
+ - go_emotions
97
+ - allenai/scicite
98
+ - liar
99
+ - relbert/lexical_relation_classification
100
+ - tasksource/linguisticprobing
101
+ - tasksource/crowdflower
102
+ - metaeval/ethics
103
+ - emo
104
+ - google_wellformed_query
105
+ - tweets_hate_speech_detection
106
+ - has_part
107
+ - blog_authorship_corpus
108
+ - launch/open_question_type
109
+ - health_fact
110
+ - commonsense_qa
111
+ - mc_taco
112
+ - ade_corpus_v2
113
+ - prajjwal1/discosense
114
+ - circa
115
+ - PiC/phrase_similarity
116
+ - copenlu/scientific-exaggeration-detection
117
+ - quarel
118
+ - mwong/fever-evidence-related
119
+ - numer_sense
120
+ - dynabench/dynasent
121
+ - raquiba/Sarcasm_News_Headline
122
+ - sem_eval_2010_task_8
123
+ - demo-org/auditor_review
124
+ - medmcqa
125
+ - RuyuanWan/Dynasent_Disagreement
126
+ - RuyuanWan/Politeness_Disagreement
127
+ - RuyuanWan/SBIC_Disagreement
128
+ - RuyuanWan/SChem_Disagreement
129
+ - RuyuanWan/Dilemmas_Disagreement
130
+ - lucasmccabe/logiqa
131
+ - wiki_qa
132
+ - tasksource/cycic_classification
133
+ - tasksource/cycic_multiplechoice
134
+ - tasksource/sts-companion
135
+ - tasksource/commonsense_qa_2.0
136
+ - tasksource/lingnli
137
+ - tasksource/monotonicity-entailment
138
+ - tasksource/arct
139
+ - tasksource/scinli
140
+ - tasksource/naturallogic
141
+ - onestop_qa
142
+ - demelin/moral_stories
143
+ - corypaik/prost
144
+ - aps/dynahate
145
+ - metaeval/syntactic-augmentation-nli
146
+ - tasksource/autotnli
147
+ - lasha-nlp/CONDAQA
148
+ - openai/webgpt_comparisons
149
+ - Dahoas/synthetic-instruct-gptj-pairwise
150
+ - metaeval/scruples
151
+ - metaeval/wouldyourather
152
+ - metaeval/defeasible-nli
153
+ - tasksource/help-nli
154
+ - metaeval/nli-veridicality-transitivity
155
+ - tasksource/lonli
156
+ - tasksource/dadc-limit-nli
157
+ - ColumbiaNLP/FLUTE
158
+ - tasksource/strategy-qa
159
+ - openai/summarize_from_feedback
160
+ - tasksource/folio
161
+ - yale-nlp/FOLIO
162
+ - tasksource/tomi-nli
163
+ - tasksource/avicenna
164
+ - stanfordnlp/SHP
165
+ - GBaker/MedQA-USMLE-4-options-hf
166
+ - sileod/wikimedqa
167
+ - declare-lab/cicero
168
+ - amydeng2000/CREAK
169
+ - tasksource/mutual
170
+ - inverse-scaling/NeQA
171
+ - inverse-scaling/quote-repetition
172
+ - inverse-scaling/redefine-math
173
+ - tasksource/puzzte
174
+ - tasksource/implicatures
175
+ - race
176
+ - tasksource/race-c
177
+ - tasksource/spartqa-yn
178
+ - tasksource/spartqa-mchoice
179
+ - tasksource/temporal-nli
180
+ - riddle_sense
181
+ - tasksource/clcd-english
182
+ - maximedb/twentyquestions
183
+ - metaeval/reclor
184
+ - tasksource/counterfactually-augmented-imdb
185
+ - tasksource/counterfactually-augmented-snli
186
+ - metaeval/cnli
187
+ - tasksource/boolq-natural-perturbations
188
+ - metaeval/acceptability-prediction
189
+ - metaeval/equate
190
+ - tasksource/ScienceQA_text_only
191
+ - Jiangjie/ekar_english
192
+ - tasksource/implicit-hate-stg1
193
+ - metaeval/chaos-mnli-ambiguity
194
+ - IlyaGusev/headline_cause
195
+ - tasksource/logiqa-2.0-nli
196
+ - tasksource/oasst2_dense_flat
197
+ - sileod/mindgames
198
+ - metaeval/ambient
199
+ - metaeval/path-naturalness-prediction
200
+ - civil_comments
201
+ - AndyChiang/cloth
202
+ - AndyChiang/dgen
203
+ - tasksource/I2D2
204
+ - webis/args_me
205
+ - webis/Touche23-ValueEval
206
+ - tasksource/starcon
207
+ - PolyAI/banking77
208
+ - tasksource/ConTRoL-nli
209
+ - tasksource/tracie
210
+ - tasksource/sherliic
211
+ - tasksource/sen-making
212
+ - tasksource/winowhy
213
+ - tasksource/robustLR
214
+ - CLUTRR/v1
215
+ - tasksource/logical-fallacy
216
+ - tasksource/parade
217
+ - tasksource/cladder
218
+ - tasksource/subjectivity
219
+ - tasksource/MOH
220
+ - tasksource/VUAC
221
+ - tasksource/TroFi
222
+ - sharc_modified
223
+ - tasksource/conceptrules_v2
224
+ - metaeval/disrpt
225
+ - tasksource/zero-shot-label-nli
226
+ - tasksource/com2sense
227
+ - tasksource/scone
228
+ - tasksource/winodict
229
+ - tasksource/fool-me-twice
230
+ - tasksource/monli
231
+ - tasksource/corr2cause
232
+ - lighteval/lsat_qa
233
+ - tasksource/apt
234
+ - zeroshot/twitter-financial-news-sentiment
235
+ - tasksource/icl-symbol-tuning-instruct
236
+ - tasksource/SpaceNLI
237
+ - sihaochen/propsegment
238
+ - HannahRoseKirk/HatemojiBuild
239
+ - tasksource/regset
240
+ - tasksource/esci
241
+ - lmsys/chatbot_arena_conversations
242
+ - neurae/dnd_style_intents
243
+ - hitachi-nlp/FLD.v2
244
+ - tasksource/SDOH-NLI
245
+ - allenai/scifact_entailment
246
+ - tasksource/feasibilityQA
247
+ - tasksource/simple_pair
248
+ - tasksource/AdjectiveScaleProbe-nli
249
+ - tasksource/resnli
250
+ - tasksource/SpaRTUN
251
+ - tasksource/ReSQ
252
+ - tasksource/semantic_fragments_nli
253
+ - MoritzLaurer/dataset_train_nli
254
+ - tasksource/stepgame
255
+ - tasksource/nlgraph
256
+ - tasksource/oasst2_pairwise_rlhf_reward
257
+ - tasksource/hh-rlhf
258
+ - tasksource/ruletaker
259
+ - qbao775/PARARULE-Plus
260
+ - tasksource/proofwriter
261
+ - tasksource/logical-entailment
262
+ - tasksource/nope
263
+ - tasksource/LogicNLI
264
+ - kiddothe2b/contract-nli
265
+ - AshtonIsNotHere/nli4ct_semeval2024
266
+ - tasksource/lsat-ar
267
+ - tasksource/lsat-rc
268
+ - AshtonIsNotHere/biosift-nli
269
+ - tasksource/brainteasers
270
+ - Anthropic/persuasion
271
+ - erbacher/AmbigNQ-clarifying-question
272
+ - tasksource/SIGA-nli
273
+ - unigram/FOL-nli
274
+ - tasksource/goal-step-wikihow
275
+ - GGLab/PARADISE
276
+ - tasksource/doc-nli
277
+ - tasksource/mctest-nli
278
+ - tasksource/patent-phrase-similarity
279
+ - tasksource/natural-language-satisfiability
280
+ - tasksource/idioms-nli
281
+ - tasksource/lifecycle-entailment
282
+ - nvidia/HelpSteer
283
+ - nvidia/HelpSteer2
284
+ - sadat2307/MSciNLI
285
+ - pushpdeep/UltraFeedback-paired
286
+ - tasksource/AES2-essay-scoring
287
+ - tasksource/english-grading
288
+ - tasksource/wice
289
+ - Dzeniks/hover
290
+ - sileod/missing-item-prediction
291
+ - tasksource/tasksource_dpo_pairs
292
  language:
293
  - en
294
  - zh
 
299
  - vqa
300
  - text
301
  - audio
 
 
302
  metrics:
303
  - accuracy
304
  - bleu