sileod committed on
Commit
2296a6b
1 Parent(s): 89f2c42

Upload DebertaV2ForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +301 -221
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -31,8 +31,8 @@
31
  2,
32
  2,
33
  2,
34
- 6,
35
  2,
 
36
  2,
37
  2,
38
  2,
@@ -46,12 +46,10 @@
46
  3,
47
  3,
48
  2,
49
- 3,
50
  2,
51
  2,
52
  2,
53
- 3,
54
- 3,
55
  3,
56
  3,
57
  3,
@@ -62,12 +60,6 @@
62
  3,
63
  2,
64
  2,
65
- 3,
66
- 3,
67
- 3,
68
- 3,
69
- 3,
70
- 3,
71
  2,
72
  3,
73
  3,
@@ -77,23 +69,6 @@
77
  3,
78
  3,
79
  3,
80
- 3,
81
- 3,
82
- 3,
83
- 3,
84
- 3,
85
- 3,
86
- 3,
87
- 3,
88
- 3,
89
- 3,
90
- 3,
91
- 3,
92
- 3,
93
- 3,
94
- 3,
95
- 3,
96
- 2,
97
  2,
98
  2,
99
  2,
@@ -243,45 +218,45 @@
243
  4,
244
  2,
245
  8,
246
- 3,
247
- 3,
248
  2,
249
  2,
250
  3,
251
  3,
252
- 20,
253
- 4,
254
  3,
255
- 2,
256
  3,
257
- 174,
258
  3,
259
- 51,
260
- 41,
 
261
  2,
262
  2,
263
  2,
264
  2,
265
  2,
 
 
 
266
  2,
 
267
  18,
 
 
268
  2,
 
269
  2,
270
  2,
271
  8,
272
  2,
273
- 3,
274
- 16,
275
- 17,
276
- 3,
277
  2,
 
 
 
 
278
  42,
279
  3,
280
- 7,
281
  12,
282
- 3,
283
- 7,
284
- 4,
285
  11,
286
  100,
287
  13,
@@ -303,7 +278,6 @@
303
  1,
304
  3,
305
  10,
306
- 77,
307
  3,
308
  10,
309
  4,
@@ -313,33 +287,33 @@
313
  28,
314
  3,
315
  6,
316
- 6,
317
  5,
318
  7,
319
- 4,
320
  3,
321
  6,
 
 
 
 
322
  2,
323
  2,
324
  2,
325
- 20,
326
- 7,
327
  2,
328
  2,
 
329
  2,
330
  2,
331
  3,
332
  4,
333
- 3,
334
  2,
335
  4,
336
- 9,
337
  13,
338
  2,
339
  2,
340
  2,
341
  2,
342
- 2,
343
  4,
344
  1,
345
  2,
@@ -365,12 +339,6 @@
365
  3,
366
  2,
367
  2,
368
- 2,
369
- 2,
370
- 2,
371
- 3,
372
- 2,
373
- 2,
374
  12,
375
  3,
376
  3,
@@ -378,7 +346,6 @@
378
  19,
379
  3,
380
  1,
381
- 1,
382
  2,
383
  2,
384
  2,
@@ -411,6 +378,7 @@
411
  2,
412
  2,
413
  2,
 
414
  3,
415
  2,
416
  2,
@@ -453,6 +421,78 @@
453
  3,
454
  2,
455
  1,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
456
  1
457
  ],
458
  "hidden_act": "gelu",
@@ -512,14 +552,14 @@
512
  "scitail/snli_format",
513
  "hans",
514
  "WANLI",
515
- "recast/recast_verbnet",
516
  "recast/recast_ner",
517
- "recast/recast_factuality",
 
 
518
  "recast/recast_puns",
519
  "recast/recast_kg_relations",
520
- "recast/recast_megaveridicality",
521
  "recast/recast_verbcorner",
522
- "recast/recast_sentiment",
523
  "probability_words_nli/usnli",
524
  "probability_words_nli/reasoning_2hop",
525
  "probability_words_nli/reasoning_1hop",
@@ -531,12 +571,10 @@
531
  "dialogue_nli",
532
  "mpe",
533
  "dnc",
534
- "gpt3_nli",
535
  "recast_white/fnplus",
536
  "recast_white/sprl",
537
  "recast_white/dpr",
538
  "joci",
539
- "contrast_nli",
540
  "robust_nli/IS_CS",
541
  "robust_nli/LI_LI",
542
  "robust_nli/ST_WO",
@@ -547,41 +585,18 @@
547
  "robust_nli/ST_LM",
548
  "robust_nli_is_sd",
549
  "robust_nli_li_ts",
550
- "gen_debiased_nli/snli_seq_z",
551
- "gen_debiased_nli/snli_z_aug",
552
- "gen_debiased_nli/snli_par_z",
553
- "gen_debiased_nli/mnli_par_z",
554
- "gen_debiased_nli/mnli_z_aug",
555
- "gen_debiased_nli/mnli_seq_z",
556
  "add_one_rte",
557
- "imppres/presupposition_only_presupposition/presupposition",
558
- "imppres/presupposition_question_presupposition/presupposition",
559
- "imppres/presupposition_cleft_uniqueness/presupposition",
560
- "imppres/presupposition_both_presupposition/presupposition",
561
- "imppres/presupposition_all_n_presupposition/presupposition",
562
- "imppres/presupposition_change_of_state/presupposition",
563
- "imppres/presupposition_possessed_definites_existence/presupposition",
564
- "imppres/presupposition_possessed_definites_uniqueness/presupposition",
565
- "imppres/presupposition_cleft_existence/presupposition",
566
- "imppres/implicature_numerals_2_3/prag",
567
- "imppres/implicature_connectives/prag",
568
- "imppres/implicature_gradable_adjective/prag",
569
- "imppres/implicature_gradable_verb/prag",
570
- "imppres/implicature_modals/prag",
571
- "imppres/implicature_numerals_10_100/prag",
572
- "imppres/implicature_quantifiers/prag",
573
  "imppres/implicature_gradable_verb/log",
574
- "imppres/implicature_modals/log",
575
- "imppres/implicature_numerals_10_100/log",
576
- "imppres/implicature_numerals_2_3/log",
577
  "imppres/implicature_quantifiers/log",
578
  "imppres/implicature_connectives/log",
 
 
579
  "imppres/implicature_gradable_adjective/log",
 
580
  "glue_diagnostics/diagnostics",
581
  "hlgd",
582
  "paws/labeled_final",
583
  "paws/labeled_swap",
584
- "quora",
585
  "medical_questions_pairs",
586
  "conll2003/pos_tags",
587
  "conll2003/chunk_tags",
@@ -590,106 +605,106 @@
590
  "model-written-evals",
591
  "truthful_qa/multiple_choice",
592
  "fig-qa",
593
- "bigbench/entailed_polarity",
594
- "bigbench/logical_args",
595
- "bigbench/sports_understanding",
596
- "bigbench/color",
597
- "bigbench/goal_step_wikihow",
598
- "bigbench/fantasy_reasoning",
599
- "bigbench/navigate",
600
- "bigbench/known_unknowns",
601
- "bigbench/real_or_fake_text",
602
- "bigbench/novel_concepts",
603
  "bigbench/logical_sequence",
604
- "bigbench/crass_ai",
605
- "bigbench/identify_odd_metaphor",
606
- "bigbench/arithmetic",
607
- "bigbench/elementary_math_qa",
608
- "bigbench/cifar10_classification",
609
- "bigbench/riddle_sense",
610
- "bigbench/salient_translation_error_detection",
611
- "bigbench/tracking_shuffled_objects",
 
 
 
 
 
 
 
 
612
  "bigbench/dark_humor_detection",
613
- "bigbench/mathematical_induction",
614
- "bigbench/implicit_relations",
615
- "bigbench/logic_grid_puzzle",
616
- "bigbench/analytic_entailment",
617
- "bigbench/temporal_sequences",
618
- "bigbench/question_selection",
619
  "bigbench/odd_one_out",
620
- "bigbench/international_phonetic_alphabet_nli",
621
- "bigbench/nonsense_words_grammar",
622
- "bigbench/play_dialog_same_or_different",
623
- "bigbench/winowhy",
624
- "bigbench/causal_judgment",
 
625
  "bigbench/disambiguation_qa",
626
- "bigbench/conceptual_combinations",
 
 
 
 
 
 
627
  "bigbench/evaluating_information_essentiality",
628
- "bigbench/code_line_description",
629
- "bigbench/physics",
630
- "bigbench/moral_permissibility",
631
- "bigbench/ruin_names",
632
- "bigbench/misconceptions",
633
- "bigbench/general_knowledge",
634
- "bigbench/phrase_relatedness",
635
- "bigbench/unit_interpretation",
636
- "bigbench/contextual_parametric_knowledge_conflicts",
637
  "bigbench/fact_checker",
 
 
638
  "bigbench/identify_math_theorems",
639
- "bigbench/logical_fallacy_detection",
640
- "bigbench/suicide_risk",
641
  "bigbench/cause_and_effect",
642
- "bigbench/timedial",
643
- "bigbench/key_value_maps",
 
 
 
 
 
 
 
 
644
  "bigbench/irony_identification",
645
- "bigbench/emojis_emotion_prediction",
646
- "bigbench/reasoning_about_colored_objects",
647
  "bigbench/hindu_knowledge",
648
- "bigbench/authorship_verification",
649
- "bigbench/human_organs_senses",
650
  "bigbench/mnist_ascii",
651
- "bigbench/epistemic_reasoning",
652
- "bigbench/metaphor_boolean",
653
- "bigbench/strategyqa",
654
- "bigbench/intent_recognition",
655
- "bigbench/metaphor_understanding",
656
- "bigbench/movie_recommendation",
657
- "bigbench/sentence_ambiguity",
658
- "bigbench/hhh_alignment",
659
- "bigbench/emoji_movie",
660
- "bigbench/geometric_shapes",
661
- "bigbench/social_iqa",
662
- "bigbench/abstract_narrative_understanding",
663
- "bigbench/penguins_in_a_table",
664
- "bigbench/anachronisms",
665
  "bigbench/formal_fallacies_syllogisms_negation",
666
- "bigbench/strange_stories",
667
- "bigbench/cs_algorithms",
668
- "bigbench/physical_intuition",
669
- "bigbench/simple_ethical_questions",
670
- "bigbench/similarities_abstraction",
671
- "bigbench/symbol_interpretation",
672
  "bigbench/bbq_lite_json",
673
- "bigbench/movie_dialog_same_or_different",
674
- "bigbench/dyck_languages",
 
675
  "bigbench/analogical_similarity",
676
- "bigbench/logical_deduction",
677
- "bigbench/snarks",
678
- "bigbench/social_support",
679
- "bigbench/empirical_judgments",
680
- "bigbench/date_understanding",
681
- "bigbench/presuppositions_as_nli",
682
- "bigbench/implicatures",
683
- "bigbench/vitaminc_fact_verification",
684
- "bigbench/checkmate_in_one",
685
- "bigbench/gre_reading_comprehension",
686
- "bigbench/undo_permutation",
687
  "bigbench/english_proverbs",
688
- "bigbench/discourse_marker_prediction",
 
 
 
689
  "bigbench/understanding_fables",
690
- "bigbench/figure_of_speech_detection",
691
- "bigbench/hyperbaton",
 
 
 
 
 
 
 
 
 
692
  "bigbench/crash_blossom",
 
 
 
 
 
 
 
 
 
693
  "cos_e/v1.0",
694
  "cosmos_qa",
695
  "dream",
@@ -700,7 +715,7 @@
700
  "head_qa/en",
701
  "sciq",
702
  "social_i_qa",
703
- "wiki_hop",
704
  "wiqa",
705
  "piqa",
706
  "hellaswag",
@@ -713,7 +728,7 @@
713
  "ai2_arc/ARC-Challenge/challenge",
714
  "ai2_arc/ARC-Easy/challenge",
715
  "definite_pronoun_resolution",
716
- "swag",
717
  "math_qa",
718
  "glue/cola",
719
  "glue/sst2",
@@ -728,45 +743,45 @@
728
  "rumoureval_2019/RumourEval2019",
729
  "ethos/binary",
730
  "ethos/multilabel",
731
- "tweet_eval/stance_feminist",
732
- "tweet_eval/stance_climate",
733
  "tweet_eval/irony",
734
  "tweet_eval/offensive",
735
  "tweet_eval/sentiment",
 
 
 
 
736
  "tweet_eval/stance_hillary",
737
  "tweet_eval/emoji",
738
- "tweet_eval/emotion",
739
- "tweet_eval/stance_atheism",
740
- "tweet_eval/hate",
741
- "tweet_eval/stance_abortion",
742
  "discovery/discovery",
743
- "pragmeval/verifiability",
744
- "pragmeval/mrda",
745
- "pragmeval/switchboard",
746
- "pragmeval/emobank-arousal",
747
- "pragmeval/emobank-dominance",
748
- "pragmeval/squinky-informativeness",
749
- "pragmeval/squinky-implicature",
750
  "pragmeval/squinky-formality",
751
  "pragmeval/emobank-valence",
 
 
 
 
 
 
 
 
752
  "pragmeval/stac",
753
- "pragmeval/persuasiveness-strength",
754
- "pragmeval/persuasiveness-specificity",
755
- "pragmeval/persuasiveness-relevance",
756
- "pragmeval/persuasiveness-premisetype",
757
- "pragmeval/persuasiveness-eloquence",
758
  "pragmeval/persuasiveness-claimtype",
 
759
  "pragmeval/pdtb",
760
- "pragmeval/gum",
761
- "pragmeval/emergent",
762
  "pragmeval/sarcasm",
763
- "silicone/oasis",
764
- "silicone/meld_s",
765
- "silicone/meld_e",
766
- "silicone/maptask",
767
- "silicone/sem",
768
  "silicone/dyda_e",
769
  "silicone/dyda_da",
 
 
 
 
 
770
  "silicone/iemocap",
771
  "lex_glue/eurlex",
772
  "lex_glue/scotus",
@@ -788,7 +803,6 @@
788
  "humicroedit/subtask-1",
789
  "humicroedit/subtask-2",
790
  "snips_built_in_intents",
791
- "banking77",
792
  "hate_speech_offensive",
793
  "yahoo_answers_topics",
794
  "stackoverflow-questions",
@@ -798,29 +812,29 @@
798
  "go_emotions/simplified",
799
  "scicite",
800
  "liar",
801
- "lexical_relation_classification/BLESS",
802
  "lexical_relation_classification/CogALexV",
803
  "lexical_relation_classification/EVALution",
804
- "lexical_relation_classification/K&H+N",
805
  "lexical_relation_classification/ROOT09",
806
- "linguisticprobing/sentence_length",
 
807
  "linguisticprobing/bigram_shift",
 
 
 
 
 
808
  "linguisticprobing/odd_man_out",
809
  "linguisticprobing/coordination_inversion",
810
- "linguisticprobing/top_constituents",
811
  "linguisticprobing/tree_depth",
812
- "linguisticprobing/past_present",
813
- "linguisticprobing/obj_number",
814
- "linguisticprobing/subj_number",
815
  "crowdflower/political-media-audience",
816
  "crowdflower/economic-news",
817
- "crowdflower/corporate-messaging",
818
- "crowdflower/airline-sentiment",
819
- "crowdflower/tweet_global_warming",
820
  "crowdflower/sentiment_nuclear_power",
821
  "crowdflower/political-media-message",
822
- "crowdflower/text_emotion",
823
  "crowdflower/political-media-bias",
 
 
 
824
  "ethics/commonsense",
825
  "ethics/deontology",
826
  "ethics/justice",
@@ -846,12 +860,6 @@
846
  "discosense",
847
  "circa",
848
  "EffectiveFeedbackStudentWriting",
849
- "promptSentiment",
850
- "promptNLI",
851
- "promptSpoke",
852
- "promptProficiency",
853
- "promptGrammar",
854
- "promptCoherence",
855
  "phrase_similarity",
856
  "scientific-exaggeration-detection",
857
  "quarel",
@@ -863,7 +871,6 @@
863
  "sem_eval_2010_task_8",
864
  "auditor_review/demo-org--auditor_review",
865
  "medmcqa",
866
- "aqua_rat/tokenized",
867
  "Dynasent_Disagreement",
868
  "Politeness_Disagreement",
869
  "SBIC_Disagreement",
@@ -892,8 +899,9 @@
892
  "scruples",
893
  "wouldyourather",
894
  "attempto-nli",
895
- "defeasible-nli/snli",
896
  "defeasible-nli/atomic",
 
 
897
  "nli-veridicality-transitivity",
898
  "natural-language-satisfiability",
899
  "lonli",
@@ -936,12 +944,84 @@
936
  "implicit-hate-stg1",
937
  "chaos-mnli-ambiguity",
938
  "headline_cause/en_simple",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
939
  "babi_nli",
 
 
 
940
  "blimp-2",
941
  "mmlu-4"
942
  ],
943
  "torch_dtype": "float32",
944
- "transformers_version": "4.26.0",
945
  "type_vocab_size": 0,
946
  "vocab_size": 128100
947
  }
 
31
  2,
32
  2,
33
  2,
 
34
  2,
35
+ 6,
36
  2,
37
  2,
38
  2,
 
46
  3,
47
  3,
48
  2,
 
49
  2,
50
  2,
51
  2,
52
+ 5,
 
53
  3,
54
  3,
55
  3,
 
60
  3,
61
  2,
62
  2,
 
 
 
 
 
 
63
  2,
64
  3,
65
  3,
 
69
  3,
70
  3,
71
  3,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
72
  2,
73
  2,
74
  2,
 
218
  4,
219
  2,
220
  8,
221
+ 2,
222
+ 4,
223
  2,
224
  2,
225
  3,
226
  3,
 
 
227
  3,
 
228
  3,
 
229
  3,
230
+ 3,
231
+ 20,
232
+ 174,
233
  2,
234
  2,
235
  2,
236
  2,
237
  2,
238
+ 41,
239
+ 51,
240
+ 3,
241
  2,
242
+ 3,
243
  18,
244
+ 17,
245
+ 3,
246
  2,
247
+ 16,
248
  2,
249
  2,
250
  8,
251
  2,
 
 
 
 
252
  2,
253
+ 7,
254
+ 4,
255
+ 7,
256
+ 3,
257
  42,
258
  3,
 
259
  12,
 
 
 
260
  11,
261
  100,
262
  13,
 
278
  1,
279
  3,
280
  10,
 
281
  3,
282
  10,
283
  4,
 
287
  28,
288
  3,
289
  6,
 
290
  5,
291
  7,
 
292
  3,
293
  6,
294
+ 4,
295
+ 2,
296
+ 20,
297
+ 6,
298
  2,
299
  2,
300
  2,
 
 
301
  2,
302
  2,
303
+ 7,
304
  2,
305
  2,
306
  3,
307
  4,
308
+ 9,
309
  2,
310
  4,
311
+ 3,
312
  13,
313
  2,
314
  2,
315
  2,
316
  2,
 
317
  4,
318
  1,
319
  2,
 
339
  3,
340
  2,
341
  2,
 
 
 
 
 
 
342
  12,
343
  3,
344
  3,
 
346
  19,
347
  3,
348
  1,
 
349
  2,
350
  2,
351
  2,
 
378
  2,
379
  2,
380
  2,
381
+ 2,
382
  3,
383
  2,
384
  2,
 
421
  3,
422
  2,
423
  1,
424
+ 1,
425
+ 1,
426
+ 2,
427
+ 2,
428
+ 50,
429
+ 50,
430
+ 50,
431
+ 50,
432
+ 2,
433
+ 1,
434
+ 1,
435
+ 1,
436
+ 1,
437
+ 1,
438
+ 1,
439
+ 1,
440
+ 1,
441
+ 1,
442
+ 1,
443
+ 1,
444
+ 2,
445
+ 2,
446
+ 2,
447
+ 2,
448
+ 77,
449
+ 2,
450
+ 1,
451
+ 3,
452
+ 2,
453
+ 2,
454
+ 1,
455
+ 1,
456
+ 2,
457
+ 2,
458
+ 2,
459
+ 2,
460
+ 2,
461
+ 2,
462
+ 2,
463
+ 2,
464
+ 2,
465
+ 3,
466
+ 18,
467
+ 13,
468
+ 2,
469
+ 2,
470
+ 2,
471
+ 2,
472
+ 2,
473
+ 2,
474
+ 4,
475
+ 2,
476
+ 24,
477
+ 23,
478
+ 67,
479
+ 279,
480
+ 3,
481
+ 2,
482
+ 2,
483
+ 1,
484
+ 2,
485
+ 2,
486
+ 3,
487
+ 1,
488
+ 2,
489
+ 3,
490
+ 3,
491
+ 2,
492
+ 3,
493
+ 3,
494
+ 3,
495
+ 1,
496
  1
497
  ],
498
  "hidden_act": "gelu",
 
552
  "scitail/snli_format",
553
  "hans",
554
  "WANLI",
 
555
  "recast/recast_ner",
556
+ "recast/recast_sentiment",
557
+ "recast/recast_megaveridicality",
558
+ "recast/recast_verbnet",
559
  "recast/recast_puns",
560
  "recast/recast_kg_relations",
 
561
  "recast/recast_verbcorner",
562
+ "recast/recast_factuality",
563
  "probability_words_nli/usnli",
564
  "probability_words_nli/reasoning_2hop",
565
  "probability_words_nli/reasoning_1hop",
 
571
  "dialogue_nli",
572
  "mpe",
573
  "dnc",
 
574
  "recast_white/fnplus",
575
  "recast_white/sprl",
576
  "recast_white/dpr",
577
  "joci",
 
578
  "robust_nli/IS_CS",
579
  "robust_nli/LI_LI",
580
  "robust_nli/ST_WO",
 
585
  "robust_nli/ST_LM",
586
  "robust_nli_is_sd",
587
  "robust_nli_li_ts",
 
 
 
 
 
 
588
  "add_one_rte",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
589
  "imppres/implicature_gradable_verb/log",
 
 
 
590
  "imppres/implicature_quantifiers/log",
591
  "imppres/implicature_connectives/log",
592
+ "imppres/implicature_numerals_2_3/log",
593
+ "imppres/implicature_numerals_10_100/log",
594
  "imppres/implicature_gradable_adjective/log",
595
+ "imppres/implicature_modals/log",
596
  "glue_diagnostics/diagnostics",
597
  "hlgd",
598
  "paws/labeled_final",
599
  "paws/labeled_swap",
 
600
  "medical_questions_pairs",
601
  "conll2003/pos_tags",
602
  "conll2003/chunk_tags",
 
605
  "model-written-evals",
606
  "truthful_qa/multiple_choice",
607
  "fig-qa",
 
 
 
 
 
 
 
 
 
 
608
  "bigbench/logical_sequence",
609
+ "bigbench/snarks",
610
+ "bigbench/general_knowledge",
611
+ "bigbench/moral_permissibility",
612
+ "bigbench/figure_of_speech_detection",
613
+ "bigbench/abstract_narrative_understanding",
614
+ "bigbench/anachronisms",
615
+ "bigbench/vitaminc_fact_verification",
616
+ "bigbench/authorship_verification",
617
+ "bigbench/penguins_in_a_table",
618
+ "bigbench/play_dialog_same_or_different",
619
+ "bigbench/physical_intuition",
620
+ "bigbench/empirical_judgments",
621
+ "bigbench/checkmate_in_one",
622
+ "bigbench/metaphor_understanding",
623
+ "bigbench/cs_algorithms",
624
+ "bigbench/dyck_languages",
625
  "bigbench/dark_humor_detection",
626
+ "bigbench/fantasy_reasoning",
 
 
 
 
 
627
  "bigbench/odd_one_out",
628
+ "bigbench/epistemic_reasoning",
629
+ "bigbench/identify_odd_metaphor",
630
+ "bigbench/discourse_marker_prediction",
631
+ "bigbench/question_selection",
632
+ "bigbench/geometric_shapes",
633
+ "bigbench/date_understanding",
634
  "bigbench/disambiguation_qa",
635
+ "bigbench/strategyqa",
636
+ "bigbench/color",
637
+ "bigbench/elementary_math_qa",
638
+ "bigbench/mathematical_induction",
639
+ "bigbench/strange_stories",
640
+ "bigbench/logical_args",
641
+ "bigbench/cifar10_classification",
642
  "bigbench/evaluating_information_essentiality",
643
+ "bigbench/novel_concepts",
644
+ "bigbench/hyperbaton",
 
 
 
 
 
 
 
645
  "bigbench/fact_checker",
646
+ "bigbench/sentence_ambiguity",
647
+ "bigbench/social_iqa",
648
  "bigbench/identify_math_theorems",
 
 
649
  "bigbench/cause_and_effect",
650
+ "bigbench/misconceptions",
651
+ "bigbench/causal_judgment",
652
+ "bigbench/international_phonetic_alphabet_nli",
653
+ "bigbench/implicit_relations",
654
+ "bigbench/salient_translation_error_detection",
655
+ "bigbench/logical_deduction",
656
+ "bigbench/known_unknowns",
657
+ "bigbench/arithmetic",
658
+ "bigbench/sports_understanding",
659
+ "bigbench/navigate",
660
  "bigbench/irony_identification",
 
 
661
  "bigbench/hindu_knowledge",
 
 
662
  "bigbench/mnist_ascii",
663
+ "bigbench/social_support",
664
+ "bigbench/presuppositions_as_nli",
665
+ "bigbench/tracking_shuffled_objects",
666
+ "bigbench/winowhy",
 
 
 
 
 
 
 
 
 
 
667
  "bigbench/formal_fallacies_syllogisms_negation",
668
+ "bigbench/emoji_movie",
669
+ "bigbench/code_line_description",
670
+ "bigbench/logical_fallacy_detection",
671
+ "bigbench/intent_recognition",
 
 
672
  "bigbench/bbq_lite_json",
673
+ "bigbench/metaphor_boolean",
674
+ "bigbench/analytic_entailment",
675
+ "bigbench/unit_interpretation",
676
  "bigbench/analogical_similarity",
677
+ "bigbench/symbol_interpretation",
678
+ "bigbench/contextual_parametric_knowledge_conflicts",
679
+ "bigbench/conceptual_combinations",
680
+ "bigbench/temporal_sequences",
 
 
 
 
 
 
 
681
  "bigbench/english_proverbs",
682
+ "bigbench/gre_reading_comprehension",
683
+ "bigbench/suicide_risk",
684
+ "bigbench/emojis_emotion_prediction",
685
+ "bigbench/phrase_relatedness",
686
  "bigbench/understanding_fables",
687
+ "bigbench/riddle_sense",
688
+ "bigbench/ruin_names",
689
+ "bigbench/physics",
690
+ "bigbench/reasoning_about_colored_objects",
691
+ "bigbench/timedial",
692
+ "bigbench/hhh_alignment",
693
+ "bigbench/nonsense_words_grammar",
694
+ "bigbench/crass_ai",
695
+ "bigbench/undo_permutation",
696
+ "bigbench/simple_ethical_questions",
697
+ "bigbench/movie_recommendation",
698
  "bigbench/crash_blossom",
699
+ "bigbench/entailed_polarity",
700
+ "bigbench/goal_step_wikihow",
701
+ "bigbench/key_value_maps",
702
+ "bigbench/real_or_fake_text",
703
+ "bigbench/human_organs_senses",
704
+ "bigbench/logic_grid_puzzle",
705
+ "bigbench/implicatures",
706
+ "bigbench/similarities_abstraction",
707
+ "bigbench/movie_dialog_same_or_different",
708
  "cos_e/v1.0",
709
  "cosmos_qa",
710
  "dream",
 
715
  "head_qa/en",
716
  "sciq",
717
  "social_i_qa",
718
+ "wiki_hop/original",
719
  "wiqa",
720
  "piqa",
721
  "hellaswag",
 
728
  "ai2_arc/ARC-Challenge/challenge",
729
  "ai2_arc/ARC-Easy/challenge",
730
  "definite_pronoun_resolution",
731
+ "swag/regular",
732
  "math_qa",
733
  "glue/cola",
734
  "glue/sst2",
 
743
  "rumoureval_2019/RumourEval2019",
744
  "ethos/binary",
745
  "ethos/multilabel",
746
+ "tweet_eval/hate",
747
+ "tweet_eval/emotion",
748
  "tweet_eval/irony",
749
  "tweet_eval/offensive",
750
  "tweet_eval/sentiment",
751
+ "tweet_eval/stance_abortion",
752
+ "tweet_eval/stance_atheism",
753
+ "tweet_eval/stance_climate",
754
+ "tweet_eval/stance_feminist",
755
  "tweet_eval/stance_hillary",
756
  "tweet_eval/emoji",
 
 
 
 
757
  "discovery/discovery",
 
 
 
 
 
 
 
758
  "pragmeval/squinky-formality",
759
  "pragmeval/emobank-valence",
760
+ "pragmeval/emobank-dominance",
761
+ "pragmeval/squinky-implicature",
762
+ "pragmeval/squinky-informativeness",
763
+ "pragmeval/switchboard",
764
+ "pragmeval/mrda",
765
+ "pragmeval/verifiability",
766
+ "pragmeval/emobank-arousal",
767
+ "pragmeval/emergent",
768
  "pragmeval/stac",
769
+ "pragmeval/gum",
 
 
 
 
770
  "pragmeval/persuasiveness-claimtype",
771
+ "pragmeval/persuasiveness-eloquence",
772
  "pragmeval/pdtb",
773
+ "pragmeval/persuasiveness-relevance",
 
774
  "pragmeval/sarcasm",
775
+ "pragmeval/persuasiveness-premisetype",
776
+ "pragmeval/persuasiveness-strength",
777
+ "pragmeval/persuasiveness-specificity",
 
 
778
  "silicone/dyda_e",
779
  "silicone/dyda_da",
780
+ "silicone/meld_e",
781
+ "silicone/meld_s",
782
+ "silicone/oasis",
783
+ "silicone/sem",
784
+ "silicone/maptask",
785
  "silicone/iemocap",
786
  "lex_glue/eurlex",
787
  "lex_glue/scotus",
 
803
  "humicroedit/subtask-1",
804
  "humicroedit/subtask-2",
805
  "snips_built_in_intents",
 
806
  "hate_speech_offensive",
807
  "yahoo_answers_topics",
808
  "stackoverflow-questions",
 
812
  "go_emotions/simplified",
813
  "scicite",
814
  "liar",
 
815
  "lexical_relation_classification/CogALexV",
816
  "lexical_relation_classification/EVALution",
 
817
  "lexical_relation_classification/ROOT09",
818
+ "lexical_relation_classification/BLESS",
819
+ "lexical_relation_classification/K&H+N",
820
  "linguisticprobing/bigram_shift",
821
+ "linguisticprobing/top_constituents",
822
+ "linguisticprobing/sentence_length",
823
+ "linguisticprobing/subj_number",
824
+ "linguisticprobing/obj_number",
825
+ "linguisticprobing/past_present",
826
  "linguisticprobing/odd_man_out",
827
  "linguisticprobing/coordination_inversion",
 
828
  "linguisticprobing/tree_depth",
829
+ "crowdflower/tweet_global_warming",
 
 
830
  "crowdflower/political-media-audience",
831
  "crowdflower/economic-news",
 
 
 
832
  "crowdflower/sentiment_nuclear_power",
833
  "crowdflower/political-media-message",
 
834
  "crowdflower/political-media-bias",
835
+ "crowdflower/corporate-messaging",
836
+ "crowdflower/airline-sentiment",
837
+ "crowdflower/text_emotion",
838
  "ethics/commonsense",
839
  "ethics/deontology",
840
  "ethics/justice",
 
860
  "discosense",
861
  "circa",
862
  "EffectiveFeedbackStudentWriting",
 
 
 
 
 
 
863
  "phrase_similarity",
864
  "scientific-exaggeration-detection",
865
  "quarel",
 
871
  "sem_eval_2010_task_8",
872
  "auditor_review/demo-org--auditor_review",
873
  "medmcqa",
 
874
  "Dynasent_Disagreement",
875
  "Politeness_Disagreement",
876
  "SBIC_Disagreement",
 
899
  "scruples",
900
  "wouldyourather",
901
  "attempto-nli",
 
902
  "defeasible-nli/atomic",
903
+ "defeasible-nli/snli",
904
+ "help-nli",
905
  "nli-veridicality-transitivity",
906
  "natural-language-satisfiability",
907
  "lonli",
 
944
  "implicit-hate-stg1",
945
  "chaos-mnli-ambiguity",
946
  "headline_cause/en_simple",
947
+ "logiqa-2.0-nli",
948
+ "oasst1_dense_flat/quality",
949
+ "oasst1_dense_flat/toxicity",
950
+ "oasst1_dense_flat/helpfulness",
951
+ "PARARULE-Plus",
952
+ "mindgames",
953
+ "universal_dependencies/en_ewt/deprel",
954
+ "universal_dependencies/en_gum/deprel",
955
+ "universal_dependencies/en_lines/deprel",
956
+ "universal_dependencies/en_partut/deprel",
957
+ "ambient",
958
+ "path-naturalness-prediction",
959
+ "civil_comments/toxicity",
960
+ "civil_comments/severe_toxicity",
961
+ "civil_comments/obscene",
962
+ "civil_comments/threat",
963
+ "civil_comments/insult",
964
+ "civil_comments/identity_attack",
965
+ "civil_comments/sexual_explicit",
966
+ "cloth",
967
+ "dgen",
968
+ "oasst1_pairwise_rlhf_reward",
969
+ "I2D2",
970
+ "args_me",
971
+ "Touche23-ValueEval",
972
+ "starcon",
973
+ "banking77",
974
+ "ruletaker",
975
+ "lsat_qa/all",
976
+ "ConTRoL-nli",
977
+ "tracie",
978
+ "sherliic",
979
+ "sen-making/1",
980
+ "sen-making/2",
981
+ "winowhy",
982
+ "mbib-base/cognitive-bias",
983
+ "mbib-base/fake-news",
984
+ "mbib-base/gender-bias",
985
+ "mbib-base/hate-speech",
986
+ "mbib-base/linguistic-bias",
987
+ "mbib-base/political-bias",
988
+ "mbib-base/racial-bias",
989
+ "mbib-base/text-level-bias",
990
+ "robustLR",
991
+ "v1/gen_train234_test2to10",
992
+ "logical-fallacy",
993
+ "parade",
994
+ "cladder",
995
+ "subjectivity",
996
+ "MOH",
997
+ "VUAC",
998
+ "TroFi",
999
+ "sharc_modified/mod",
1000
+ "conceptrules_v2",
1001
+ "disrpt/eng.dep.scidtb",
1002
+ "conll2000",
1003
+ "few-nerd/supervised",
1004
+ "finer-139",
1005
+ "zero-shot-label-nli",
1006
+ "com2sense",
1007
+ "scone",
1008
+ "winodict",
1009
+ "fool-me-twice",
1010
+ "monli",
1011
+ "corr2cause",
1012
+ "lsat_qa/all",
1013
+ "apt",
1014
+ "twitter-financial-news-sentiment",
1015
+ "SpaceNLI",
1016
  "babi_nli",
1017
+ "gen_debiased_nli",
1018
+ "imppres/presupposition",
1019
+ "/prag",
1020
  "blimp-2",
1021
  "mmlu-4"
1022
  ],
1023
  "torch_dtype": "float32",
1024
+ "transformers_version": "4.26.1",
1025
  "type_vocab_size": 0,
1026
  "vocab_size": 128100
1027
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:706433291e04d0a5099445cda6c065dc027c17490f6e29b6375f5cb2e930c24c
3
  size 1740400377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc7a150f04b55cf0740b9ab332e6adf1634b23f7bf5aab69d8f3d0c5c87e0efd
3
  size 1740400377