{ "_name_or_path": "microsoft/mdeberta-v3-base", "architectures": [ "DebertaV2ForSequenceClassification" ], "attention_probs_dropout_prob": 0.1, "classifiers_size": [ 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 15, 31, 12, 31, 11, 2, 2, 3, 5, 6, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 6, 6, 6, 69, 2, 1, 8, 10, 2, 2, 5, 2, 2, 2, 2, 1, 1, 1, 20, 235, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 9, 17, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 1 ], "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "entailment", "1": "neutral", "2": "contradiction" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "contradiction": 2, "entailment": 0, "neutral": 1 }, "layer_norm_eps": 1e-07, "max_position_embeddings": 512, "max_relative_positions": -1, "model_type": "deberta-v2", "norm_rel_ebd": "layer_norm", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 0, "pooler_dropout": 0, "pooler_hidden_act": "gelu", "pooler_hidden_size": 768, "pos_att_type": [ "p2c", "c2p" ], "position_biased_input": false, "position_buckets": 256, "relative_attention": true, "share_att_key": true, "tasks": [ "xnli/es", "xnli/ar", "xnli/bg", "xnli/de", "xnli/el", "xnli/en", "xnli/fr", "xnli/hi", "xnli/ru", "xnli/sw", "xnli/th", "xnli/tr", "xnli/ur", "xnli/vi", "xnli/zh", "americas_nli/all_languages", "multilingual-NLI-26lang-2mil7", "stsb_multi_mt/zh", "stsb_multi_mt/pt", "stsb_multi_mt/pl", "stsb_multi_mt/nl", "stsb_multi_mt/it", "stsb_multi_mt/fr", "stsb_multi_mt/es", "stsb_multi_mt/de", "stsb_multi_mt/en", "stsb_multi_mt/ru", "paws-x/ko", "paws-x/zh", "paws-x/fr", "paws-x/es", "paws-x/de", "paws-x/en", "paws-x/ja", "miam/ilisten", "miam/vm2", "miam/maptask", "miam/loria", "miam/dihana", "x-stance/fr", "x-stance/de", "multilingual-sentiments/all", "universal-joy", "amazon_reviews_multi/all_languages", "tweet_sentiment_multilingual/all", "tweet_sentiment_multilingual/spanish", "tweet_sentiment_multilingual/portuguese", "tweet_sentiment_multilingual/italian", "tweet_sentiment_multilingual/arabic", "tweet_sentiment_multilingual/german", "tweet_sentiment_multilingual/french", "tweet_sentiment_multilingual/english", "tweet_sentiment_multilingual/hindi", "offenseval_2020/da", "offenseval_2020/gr", "offenseval_2020/tr", "offenseval_2020/ar", "offenseval_dravidian/tamil", "offenseval_dravidian/malayalam", "offenseval_dravidian/kannada", "MLMA_hate_speech", "xglue/qam", "xsum_factuality", "x-fact", "xglue/nc", "xglue/qadsm", "xglue/qam", "xglue/wpr", "xlwic/xlwic_de_de", "xlwic/xlwic_fr_fr", "xlwic/xlwic_en_ko", "xlwic/xlwic_it_it", "oasst1_dense_flat/quality", "oasst1_dense_flat/toxicity", "oasst1_dense_flat/helpfulness", "language-identification", "wili_2018", "exams/multilingual", "xcsr/X-CODAH-en", "xcsr/X-CSQA-ur", "xcsr/X-CSQA-sw", "xcsr/X-CSQA-hi", "xcsr/X-CSQA-vi", "xcsr/X-CSQA-ar", "xcsr/X-CSQA-ru", "xcsr/X-CSQA-jap", "xcsr/X-CSQA-nl", "xcsr/X-CODAH-zh", "xcsr/X-CSQA-it", "xcsr/X-CSQA-fr", "xcsr/X-CSQA-es", "xcsr/X-CSQA-de", "xcsr/X-CSQA-zh", "xcsr/X-CSQA-en", "xcsr/X-CSQA-pl", "xcsr/X-CODAH-de", "xcsr/X-CSQA-pt", "xcsr/X-CODAH-fr", "xcsr/X-CODAH-es", "xcsr/X-CODAH-ur", "xcsr/X-CODAH-sw", "xcsr/X-CODAH-hi", "xcsr/X-CODAH-ar", "xcsr/X-CODAH-vi", "xcsr/X-CODAH-pt", "xcsr/X-CODAH-pl", "xcsr/X-CODAH-nl", "xcsr/X-CODAH-jap", "xcsr/X-CODAH-it", "xcsr/X-CODAH-ru", "xcopa/ta", "xcopa/vi", "xcopa/tr", "xcopa/th", "xcopa/zh", "xcopa/et", "xcopa/qu", "xcopa/id", "xcopa/it", "xcopa/ht", "xcopa/translation-et", "xcopa/sw", "xcopa/translation-ht", "xcopa/translation-th", "xcopa/translation-id", "xcopa/translation-sw", "xcopa/translation-zh", "xcopa/translation-ta", "xcopa/translation-tr", "xcopa/translation-vi", "xcopa/translation-it", "xstory_cloze/id", "xstory_cloze/hi", "xstory_cloze/ar", "xstory_cloze/es", "xstory_cloze/en", "xstory_cloze/ru", "xstory_cloze/te", "xstory_cloze/sw", "xstory_cloze/zh", "xstory_cloze/eu", "xstory_cloze/my", "hh-rlhf", "xglue/ner", "xglue/pos", "universal_dependencies/ja_gsd/pos", "universal_dependencies/fr_pud/pos", "universal_dependencies/fr_partut/pos", "universal_dependencies/fr_gsd/pos", "universal_dependencies/fr_ftb/pos", "universal_dependencies/fr_fqb/pos", "universal_dependencies/fi_tdt/pos", "universal_dependencies/fi_pud/pos", "universal_dependencies/fi_ood/pos", "universal_dependencies/fi_ftb/pos", "universal_dependencies/fo_oft/pos", "universal_dependencies/fo_farpahc/pos", "universal_dependencies/et_ewt/pos", "universal_dependencies/et_edt/pos", "universal_dependencies/myv_jr/pos", "universal_dependencies/en_pud/pos", "universal_dependencies/en_pronouns/pos", "universal_dependencies/en_partut/pos", "universal_dependencies/fr_sequoia/pos", "universal_dependencies/fr_spoken/pos", "universal_dependencies/gl_ctg/pos", "universal_dependencies/gl_treegal/pos", "universal_dependencies/it_postwita/pos", "universal_dependencies/it_partut/pos", "universal_dependencies/it_isdt/pos", "universal_dependencies/ga_idt/pos", "universal_dependencies/id_pud/pos", "universal_dependencies/id_gsd/pos", "universal_dependencies/id_csui/pos", "universal_dependencies/is_pud/pos", "universal_dependencies/is_icepahc/pos", "universal_dependencies/en_lines/pos", "universal_dependencies/hu_szeged/pos", "universal_dependencies/hi_hdtb/pos", "universal_dependencies/qhe_hiencs/pos", "universal_dependencies/he_htb/pos", "universal_dependencies/el_gdt/pos", "universal_dependencies/got_proiel/pos", "universal_dependencies/de_pud/pos", "universal_dependencies/de_lit/pos", "universal_dependencies/de_hdt/pos", "universal_dependencies/de_gsd/pos", "universal_dependencies/hi_pud/pos", "universal_dependencies/en_gumreddit/pos", "universal_dependencies/en_ewt/pos", "universal_dependencies/it_pud/pos", "universal_dependencies/bho_bhtb/pos", "universal_dependencies/be_hse/pos", "universal_dependencies/eu_bdt/pos", "universal_dependencies/bm_crb/pos", "universal_dependencies/aii_as/pos", "universal_dependencies/hy_armtdp/pos", "universal_dependencies/ar_pud/pos", "universal_dependencies/ar_padt/pos", "universal_dependencies/br_keb/pos", "universal_dependencies/ar_nyuad/pos", "universal_dependencies/grc_proiel/pos", "universal_dependencies/grc_perseus/pos", "universal_dependencies/am_att/pos", "universal_dependencies/sq_tsa/pos", "universal_dependencies/aqz_tudet/pos", "universal_dependencies/akk_riao/pos", "universal_dependencies/akk_pisandub/pos", "universal_dependencies/af_afribooms/pos", "universal_dependencies/apu_ufpa/pos", "universal_dependencies/bg_btb/pos", "universal_dependencies/bxr_bdt/pos", "universal_dependencies/yue_hk/pos", "universal_dependencies/en_esl/pos", "universal_dependencies/nl_lassysmall/pos", "universal_dependencies/nl_alpino/pos", "universal_dependencies/da_ddt/pos", "universal_dependencies/cs_pud/pos", "universal_dependencies/cs_pdt/pos", "universal_dependencies/cs_fictree/pos", "universal_dependencies/cs_cltt/pos", "universal_dependencies/cs_cac/pos", "universal_dependencies/hr_set/pos", "universal_dependencies/cop_scriptorium/pos", "universal_dependencies/lzh_kyoto/pos", "universal_dependencies/ckt_hse/pos", "universal_dependencies/zh_pud/pos", "universal_dependencies/zh_hk/pos", "universal_dependencies/zh_gsdsimp/pos", "universal_dependencies/zh_gsd/pos", "universal_dependencies/zh_cfl/pos", "universal_dependencies/ca_ancora/pos", "universal_dependencies/en_gum/pos", "universal_dependencies/ja_bccwj/pos", "universal_dependencies/it_twittiro/pos", "universal_dependencies/wo_wtb/pos", "universal_dependencies/gun_thomas/pos", "universal_dependencies/mdf_jr/pos", "universal_dependencies/myu_tudet/pos", "universal_dependencies/pcm_nsc/pos", "universal_dependencies/nyq_aha/pos", "universal_dependencies/sme_giella/pos", "universal_dependencies/no_bokmaal/pos", "universal_dependencies/no_nynorsk/pos", "universal_dependencies/no_nynorsklia/pos", "universal_dependencies/cu_proiel/pos", "universal_dependencies/fro_srcmf/pos", "universal_dependencies/orv_rnc/pos", "universal_dependencies/orv_torot/pos", "universal_dependencies/otk_tonqq/pos", "universal_dependencies/fa_perdt/pos", "universal_dependencies/fa_seraji/pos", "universal_dependencies/pl_lfg/pos", "universal_dependencies/pl_pdb/pos", "universal_dependencies/pl_pud/pos", "universal_dependencies/gun_dooley/pos", "universal_dependencies/mr_ufal/pos", "universal_dependencies/it_vit/pos", "universal_dependencies/mt_mudt/pos", "universal_dependencies/ja_modern/pos", "universal_dependencies/ja_pud/pos", "universal_dependencies/krl_kkpp/pos", "universal_dependencies/kk_ktb/pos", "universal_dependencies/kfm_aha/pos", "universal_dependencies/koi_uh/pos", "universal_dependencies/kpv_ikdp/pos", "universal_dependencies/kpv_lattice/pos", "universal_dependencies/ko_gsd/pos", "universal_dependencies/pt_bosque/pos", "universal_dependencies/ko_kaist/pos", "universal_dependencies/kmr_mg/pos", "universal_dependencies/la_ittb/pos", "universal_dependencies/la_llct/pos", "universal_dependencies/la_perseus/pos", "universal_dependencies/la_proiel/pos", "universal_dependencies/lv_lvtb/pos", "universal_dependencies/lt_alksnis/pos", "universal_dependencies/lt_hse/pos", "universal_dependencies/olo_kkpp/pos", "universal_dependencies/ko_pud/pos", "universal_dependencies/yo_ytb/pos", "universal_dependencies/pt_gsd/pos", "universal_dependencies/ro_nonstandard/pos", "universal_dependencies/tl_trg/pos", "universal_dependencies/tl_ugnayan/pos", "universal_dependencies/ta_mwtt/pos", "universal_dependencies/ta_ttb/pos", "universal_dependencies/te_mtg/pos", "universal_dependencies/th_pud/pos", "universal_dependencies/tpn_tudet/pos", "universal_dependencies/qtd_sagt/pos", "universal_dependencies/tr_boun/pos", "universal_dependencies/tr_gb/pos", "universal_dependencies/tr_imst/pos", "universal_dependencies/tr_pud/pos", "universal_dependencies/uk_iu/pos", "universal_dependencies/hsb_ufal/pos", "universal_dependencies/ur_udtb/pos", "universal_dependencies/ug_udt/pos", "universal_dependencies/vi_vtb/pos", "universal_dependencies/wbp_ufal/pos", "universal_dependencies/cy_ccg/pos", "universal_dependencies/gsw_uzh/pos", "universal_dependencies/pt_pud/pos", "universal_dependencies/sv_talbanken/pos", "universal_dependencies/sv_lines/pos", "universal_dependencies/ro_rrt/pos", "universal_dependencies/ro_simonero/pos", "universal_dependencies/ru_gsd/pos", "universal_dependencies/ru_pud/pos", "universal_dependencies/ru_syntagrus/pos", "universal_dependencies/ru_taiga/pos", "universal_dependencies/sa_ufal/pos", "universal_dependencies/sa_vedic/pos", "universal_dependencies/gd_arcosg/pos", "universal_dependencies/sv_pud/pos", "universal_dependencies/sr_set/pos", "universal_dependencies/sk_snk/pos", "universal_dependencies/sl_ssj/pos", "universal_dependencies/sl_sst/pos", "universal_dependencies/soj_aha/pos", "universal_dependencies/ajp_madar/pos", "universal_dependencies/es_ancora/pos", "universal_dependencies/es_gsd/pos", "universal_dependencies/es_pud/pos", "universal_dependencies/swl_sslc/pos", "universal_dependencies/sms_giellagas/pos", "universal_dependencies/gv_cadhan/pos", "oasst1_pairwise_rlhf_reward" ], "torch_dtype": "float32", "transformers_version": "4.26.1", "type_vocab_size": 0, "vocab_size": 251000 }