Xsent-mDeberta-v3-base / config.json
HasinMDG's picture
Upload DebertaV2ForSequenceClassification
9654050
{
"_name_or_path": "/kaggle/input/xsent-mdeberta-distilled/tmp/base_model",
"architectures": [
"DebertaV2ForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifiers_size": [
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
2,
2,
2,
2,
2,
2,
2,
31,
12,
31,
11,
15,
2,
2,
2,
2,
2,
2,
6,
6,
6,
2,
8,
10,
2,
2,
5,
2,
2,
2,
2,
1,
1,
1,
20,
235,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
9,
17,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
1,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
6,
5,
3,
1,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
60,
2,
73,
73,
73,
73,
73,
73,
73,
73,
73,
73,
73,
73,
73,
113,
3
],
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1",
"2": "LABEL_2",
"3": "LABEL_3"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_2": 2,
"LABEL_3": 3
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"norm_rel_ebd": "layer_norm",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 768,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"position_buckets": 256,
"relative_attention": true,
"share_att_key": true,
"tasks": [
"multilingual-NLI-26lang-2mil7",
"xnli/ru",
"xnli/tr",
"xnli/ur",
"xnli/vi",
"xnli/zh",
"xnli/hi",
"xnli/fr",
"xnli/es",
"xnli/en",
"xnli/el",
"xnli/de",
"xnli/bg",
"xnli/ar",
"xnli/th",
"xnli/sw",
"americas_nli/all_languages",
"stsb_multi_mt/en",
"stsb_multi_mt/fr",
"stsb_multi_mt/de",
"stsb_multi_mt/es",
"stsb_multi_mt/it",
"stsb_multi_mt/nl",
"stsb_multi_mt/pl",
"stsb_multi_mt/pt",
"stsb_multi_mt/ru",
"stsb_multi_mt/zh",
"paws-x/zh",
"paws-x/ja",
"paws-x/ko",
"paws-x/en",
"paws-x/de",
"paws-x/es",
"paws-x/fr",
"miam/vm2",
"miam/maptask",
"miam/loria",
"miam/dihana",
"miam/ilisten",
"x-stance/fr",
"x-stance/de",
"offenseval_2020/da",
"offenseval_2020/tr",
"offenseval_2020/gr",
"offenseval_2020/ar",
"offenseval_dravidian/tamil",
"offenseval_dravidian/malayalam",
"offenseval_dravidian/kannada",
"xglue/qam",
"x-fact",
"xglue/nc",
"xglue/qadsm",
"xglue/qam",
"xglue/wpr",
"xlwic/xlwic_fr_fr",
"xlwic/xlwic_en_ko",
"xlwic/xlwic_it_it",
"xlwic/xlwic_de_de",
"oasst1_dense_flat/quality",
"oasst1_dense_flat/toxicity",
"oasst1_dense_flat/helpfulness",
"language-identification",
"wili_2018",
"exams/multilingual",
"xcsr/X-CSQA-ar",
"xcsr/X-CODAH-zh",
"xcsr/X-CODAH-de",
"xcsr/X-CSQA-ru",
"xcsr/X-CODAH-fr",
"xcsr/X-CODAH-it",
"xcsr/X-CODAH-jap",
"xcsr/X-CODAH-nl",
"xcsr/X-CODAH-pt",
"xcsr/X-CODAH-en",
"xcsr/X-CODAH-ru",
"xcsr/X-CODAH-ar",
"xcsr/X-CODAH-vi",
"xcsr/X-CODAH-hi",
"xcsr/X-CODAH-sw",
"xcsr/X-CODAH-ur",
"xcsr/X-CODAH-pl",
"xcsr/X-CSQA-ur",
"xcsr/X-CODAH-es",
"xcsr/X-CSQA-pt",
"xcsr/X-CSQA-vi",
"xcsr/X-CSQA-hi",
"xcsr/X-CSQA-pl",
"xcsr/X-CSQA-sw",
"xcsr/X-CSQA-nl",
"xcsr/X-CSQA-jap",
"xcsr/X-CSQA-it",
"xcsr/X-CSQA-es",
"xcsr/X-CSQA-fr",
"xcsr/X-CSQA-zh",
"xcsr/X-CSQA-en",
"xcsr/X-CSQA-de",
"xcopa/qu",
"xcopa/it",
"xcopa/ht",
"xcopa/et",
"xcopa/vi",
"xcopa/id",
"xcopa/translation-et",
"xcopa/th",
"xcopa/sw",
"xcopa/translation-sw",
"xcopa/translation-ht",
"xcopa/translation-it",
"xcopa/ta",
"xcopa/translation-zh",
"xcopa/translation-vi",
"xcopa/translation-id",
"xcopa/translation-tr",
"xcopa/translation-th",
"xcopa/translation-ta",
"xcopa/zh",
"xcopa/tr",
"xstory_cloze/eu",
"xstory_cloze/my",
"xstory_cloze/te",
"xstory_cloze/sw",
"xstory_cloze/en",
"xstory_cloze/ru",
"xstory_cloze/zh",
"xstory_cloze/es",
"xstory_cloze/ar",
"xstory_cloze/hi",
"xstory_cloze/id",
"xglue/ner",
"xglue/pos",
"universal_dependencies/sme_giella/pos",
"universal_dependencies/no_bokmaal/pos",
"universal_dependencies/no_nynorsk/pos",
"universal_dependencies/no_nynorsklia/pos",
"universal_dependencies/cu_proiel/pos",
"universal_dependencies/fro_srcmf/pos",
"universal_dependencies/orv_rnc/pos",
"universal_dependencies/pl_lfg/pos",
"universal_dependencies/otk_tonqq/pos",
"universal_dependencies/fa_perdt/pos",
"universal_dependencies/fa_seraji/pos",
"universal_dependencies/pcm_nsc/pos",
"universal_dependencies/pl_pdb/pos",
"universal_dependencies/pl_pud/pos",
"universal_dependencies/pt_bosque/pos",
"universal_dependencies/pt_gsd/pos",
"universal_dependencies/pt_pud/pos",
"universal_dependencies/orv_torot/pos",
"universal_dependencies/myu_tudet/pos",
"universal_dependencies/gv_cadhan/pos",
"universal_dependencies/gun_thomas/pos",
"universal_dependencies/koi_uh/pos",
"universal_dependencies/kpv_ikdp/pos",
"universal_dependencies/kpv_lattice/pos",
"universal_dependencies/ko_gsd/pos",
"universal_dependencies/ko_kaist/pos",
"universal_dependencies/ko_pud/pos",
"universal_dependencies/kmr_mg/pos",
"universal_dependencies/la_ittb/pos",
"universal_dependencies/la_llct/pos",
"universal_dependencies/la_perseus/pos",
"universal_dependencies/la_proiel/pos",
"universal_dependencies/lv_lvtb/pos",
"universal_dependencies/lt_alksnis/pos",
"universal_dependencies/lt_hse/pos",
"universal_dependencies/olo_kkpp/pos",
"universal_dependencies/mt_mudt/pos",
"universal_dependencies/ro_nonstandard/pos",
"universal_dependencies/mr_ufal/pos",
"universal_dependencies/gun_dooley/pos",
"universal_dependencies/mdf_jr/pos",
"universal_dependencies/ro_rrt/pos",
"universal_dependencies/ru_taiga/pos",
"universal_dependencies/ru_gsd/pos",
"universal_dependencies/ta_mwtt/pos",
"universal_dependencies/ta_ttb/pos",
"universal_dependencies/te_mtg/pos",
"universal_dependencies/th_pud/pos",
"universal_dependencies/qtd_sagt/pos",
"universal_dependencies/tr_boun/pos",
"universal_dependencies/tr_gb/pos",
"universal_dependencies/tr_imst/pos",
"universal_dependencies/tr_pud/pos",
"universal_dependencies/uk_iu/pos",
"universal_dependencies/hsb_ufal/pos",
"universal_dependencies/ur_udtb/pos",
"universal_dependencies/ug_udt/pos",
"universal_dependencies/vi_vtb/pos",
"universal_dependencies/wbp_ufal/pos",
"universal_dependencies/cy_ccg/pos",
"universal_dependencies/wo_wtb/pos",
"universal_dependencies/yo_ytb/pos",
"universal_dependencies/tl_ugnayan/pos",
"universal_dependencies/ro_simonero/pos",
"universal_dependencies/tl_trg/pos",
"universal_dependencies/sv_talbanken/pos",
"universal_dependencies/ru_pud/pos",
"universal_dependencies/ru_syntagrus/pos",
"universal_dependencies/sa_ufal/pos",
"universal_dependencies/sa_vedic/pos",
"universal_dependencies/gd_arcosg/pos",
"universal_dependencies/sr_set/pos",
"universal_dependencies/sms_giellagas/pos",
"universal_dependencies/sk_snk/pos",
"universal_dependencies/sl_ssj/pos",
"universal_dependencies/sl_sst/pos",
"universal_dependencies/ajp_madar/pos",
"universal_dependencies/es_ancora/pos",
"universal_dependencies/es_gsd/pos",
"universal_dependencies/es_pud/pos",
"universal_dependencies/swl_sslc/pos",
"universal_dependencies/sv_lines/pos",
"universal_dependencies/sv_pud/pos",
"universal_dependencies/gsw_uzh/pos",
"universal_dependencies/kk_ktb/pos",
"universal_dependencies/hi_hdtb/pos",
"universal_dependencies/ja_pud/pos",
"universal_dependencies/zh_gsd/pos",
"universal_dependencies/zh_gsdsimp/pos",
"universal_dependencies/zh_hk/pos",
"universal_dependencies/zh_pud/pos",
"universal_dependencies/ckt_hse/pos",
"universal_dependencies/lzh_kyoto/pos",
"universal_dependencies/cop_scriptorium/pos",
"universal_dependencies/hr_set/pos",
"universal_dependencies/cs_cac/pos",
"universal_dependencies/cs_cltt/pos",
"universal_dependencies/cs_fictree/pos",
"universal_dependencies/cs_pdt/pos",
"universal_dependencies/cs_pud/pos",
"universal_dependencies/da_ddt/pos",
"universal_dependencies/nl_alpino/pos",
"universal_dependencies/nl_lassysmall/pos",
"universal_dependencies/en_esl/pos",
"universal_dependencies/en_ewt/pos",
"universal_dependencies/en_gum/pos",
"universal_dependencies/zh_cfl/pos",
"universal_dependencies/ca_ancora/pos",
"universal_dependencies/yue_hk/pos",
"universal_dependencies/bxr_bdt/pos",
"universal_dependencies/af_afribooms/pos",
"universal_dependencies/krl_kkpp/pos",
"universal_dependencies/akk_riao/pos",
"universal_dependencies/aqz_tudet/pos",
"universal_dependencies/sq_tsa/pos",
"universal_dependencies/am_att/pos",
"universal_dependencies/grc_perseus/pos",
"universal_dependencies/grc_proiel/pos",
"universal_dependencies/apu_ufpa/pos",
"universal_dependencies/en_gumreddit/pos",
"universal_dependencies/ar_nyuad/pos",
"universal_dependencies/ar_pud/pos",
"universal_dependencies/hy_armtdp/pos",
"universal_dependencies/aii_as/pos",
"universal_dependencies/bm_crb/pos",
"universal_dependencies/eu_bdt/pos",
"universal_dependencies/be_hse/pos",
"universal_dependencies/bho_bhtb/pos",
"universal_dependencies/br_keb/pos",
"universal_dependencies/bg_btb/pos",
"universal_dependencies/ar_padt/pos",
"universal_dependencies/en_lines/pos",
"universal_dependencies/akk_pisandub/pos",
"universal_dependencies/en_pronouns/pos",
"universal_dependencies/el_gdt/pos",
"universal_dependencies/he_htb/pos",
"universal_dependencies/qhe_hiencs/pos",
"universal_dependencies/hi_pud/pos",
"universal_dependencies/hu_szeged/pos",
"universal_dependencies/is_icepahc/pos",
"universal_dependencies/id_csui/pos",
"universal_dependencies/id_gsd/pos",
"universal_dependencies/id_pud/pos",
"universal_dependencies/ga_idt/pos",
"universal_dependencies/it_isdt/pos",
"universal_dependencies/it_partut/pos",
"universal_dependencies/it_postwita/pos",
"universal_dependencies/it_pud/pos",
"universal_dependencies/it_twittiro/pos",
"universal_dependencies/it_vit/pos",
"universal_dependencies/ja_bccwj/pos",
"universal_dependencies/ja_gsd/pos",
"universal_dependencies/ja_modern/pos",
"universal_dependencies/got_proiel/pos",
"universal_dependencies/de_pud/pos",
"universal_dependencies/is_pud/pos",
"universal_dependencies/de_hdt/pos",
"universal_dependencies/en_pud/pos",
"universal_dependencies/myv_jr/pos",
"universal_dependencies/de_lit/pos",
"universal_dependencies/et_ewt/pos",
"universal_dependencies/fo_farpahc/pos",
"universal_dependencies/fo_oft/pos",
"universal_dependencies/fi_ftb/pos",
"universal_dependencies/fi_ood/pos",
"universal_dependencies/fi_pud/pos",
"universal_dependencies/fi_tdt/pos",
"universal_dependencies/et_edt/pos",
"universal_dependencies/fr_ftb/pos",
"universal_dependencies/fr_fqb/pos",
"universal_dependencies/de_gsd/pos",
"universal_dependencies/gl_treegal/pos",
"universal_dependencies/gl_ctg/pos",
"universal_dependencies/fr_spoken/pos",
"universal_dependencies/en_partut/pos",
"universal_dependencies/fr_pud/pos",
"universal_dependencies/fr_partut/pos",
"universal_dependencies/fr_sequoia/pos",
"universal_dependencies/fr_gsd/pos",
"oasst1_pairwise_rlhf_reward",
"multilingual-sentiments/all",
"tweet_sentiment_multilingual/arabic",
"tweet_sentiment_multilingual/french",
"tweet_sentiment_multilingual/english",
"tweet_sentiment_multilingual/hindi",
"tweet_sentiment_multilingual/portuguese",
"tweet_sentiment_multilingual/spanish",
"tweet_sentiment_multilingual/all",
"tweet_sentiment_multilingual/german",
"tweet_sentiment_multilingual/italian",
"amazon_reviews_multi/all_languages",
"universal-joy",
"mms",
"ACES",
"massive/my-MM",
"massive/ro-RO",
"massive/pt-PT",
"massive/pl-PL",
"massive/nl-NL",
"massive/nb-NO",
"massive/es-ES",
"massive/ms-MY",
"massive/mn-MN",
"massive/ml-IN",
"massive/lv-LV",
"massive/ko-KR",
"massive/ru-RU",
"massive/kn-IN",
"massive/ka-GE",
"massive/jv-ID",
"massive/ja-JP",
"massive/it-IT",
"massive/is-IS",
"massive/id-ID",
"massive/hy-AM",
"massive/hu-HU",
"massive/hi-IN",
"massive/he-IL",
"massive/fr-FR",
"massive/km-KH",
"massive/fi-FI",
"massive/sl-SL",
"massive/sv-SE",
"massive/af-ZA",
"massive/am-ET",
"massive/ar-SA",
"massive/az-AZ",
"massive/bn-BD",
"massive/ca-ES",
"massive/cy-GB",
"massive/da-DK",
"massive/de-DE",
"massive/el-GR",
"massive/sq-AL",
"massive/en-US",
"massive/all",
"massive/zh-TW",
"massive/zh-CN",
"massive/vi-VN",
"massive/ur-PK",
"massive/tr-TR",
"massive/tl-PH",
"massive/th-TH",
"massive/te-IN",
"massive/ta-IN",
"massive/sw-KE",
"massive/all_1.1",
"massive/fa-IR",
"tydi-as2-balanced",
"multiconer_v2/Hindi (HI)",
"multiconer_v2/Multilingual (MULTI)",
"multiconer_v2/Ukrainian (UK)",
"multiconer_v2/Swedish (SV)",
"multiconer_v2/Spanish (ES)",
"multiconer_v2/Bangla (BN)",
"multiconer_v2/Chinese (ZH)",
"multiconer_v2/English (EN)",
"multiconer_v2/Farsi (FA)",
"multiconer_v2/Portuguese (PT)",
"multiconer_v2/German (DE)",
"multiconer_v2/Italian (IT)",
"multiconer_v2/French (FR)",
"mtop",
"multilingual-zero-shot-label-nli"
],
"torch_dtype": "float32",
"transformers_version": "4.31.0",
"type_vocab_size": 0,
"vocab_size": 251000
}