| { |
| "_name_or_path": "/kaggle/input/xsent-mdeberta-distilled/tmp/base_model", |
| "architectures": [ |
| "DebertaV2ForSequenceClassification" |
| ], |
| "attention_probs_dropout_prob": 0.1, |
| "classifiers_size": [ |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 31, |
| 12, |
| 31, |
| 11, |
| 15, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 6, |
| 6, |
| 6, |
| 2, |
| 8, |
| 10, |
| 2, |
| 2, |
| 5, |
| 2, |
| 2, |
| 2, |
| 2, |
| 1, |
| 1, |
| 1, |
| 20, |
| 235, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 1, |
| 9, |
| 17, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 18, |
| 1, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 6, |
| 5, |
| 3, |
| 1, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 60, |
| 2, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 73, |
| 113, |
| 3 |
| ], |
| "hidden_act": "gelu", |
| "hidden_dropout_prob": 0.1, |
| "hidden_size": 768, |
| "id2label": { |
| "0": "LABEL_0", |
| "1": "LABEL_1", |
| "2": "LABEL_2", |
| "3": "LABEL_3" |
| }, |
| "initializer_range": 0.02, |
| "intermediate_size": 3072, |
| "label2id": { |
| "LABEL_0": 0, |
| "LABEL_1": 1, |
| "LABEL_2": 2, |
| "LABEL_3": 3 |
| }, |
| "layer_norm_eps": 1e-07, |
| "max_position_embeddings": 512, |
| "max_relative_positions": -1, |
| "model_type": "deberta-v2", |
| "norm_rel_ebd": "layer_norm", |
| "num_attention_heads": 12, |
| "num_hidden_layers": 12, |
| "pad_token_id": 0, |
| "pooler_dropout": 0, |
| "pooler_hidden_act": "gelu", |
| "pooler_hidden_size": 768, |
| "pos_att_type": [ |
| "p2c", |
| "c2p" |
| ], |
| "position_biased_input": false, |
| "position_buckets": 256, |
| "relative_attention": true, |
| "share_att_key": true, |
| "tasks": [ |
| "multilingual-NLI-26lang-2mil7", |
| "xnli/ru", |
| "xnli/tr", |
| "xnli/ur", |
| "xnli/vi", |
| "xnli/zh", |
| "xnli/hi", |
| "xnli/fr", |
| "xnli/es", |
| "xnli/en", |
| "xnli/el", |
| "xnli/de", |
| "xnli/bg", |
| "xnli/ar", |
| "xnli/th", |
| "xnli/sw", |
| "americas_nli/all_languages", |
| "stsb_multi_mt/en", |
| "stsb_multi_mt/fr", |
| "stsb_multi_mt/de", |
| "stsb_multi_mt/es", |
| "stsb_multi_mt/it", |
| "stsb_multi_mt/nl", |
| "stsb_multi_mt/pl", |
| "stsb_multi_mt/pt", |
| "stsb_multi_mt/ru", |
| "stsb_multi_mt/zh", |
| "paws-x/zh", |
| "paws-x/ja", |
| "paws-x/ko", |
| "paws-x/en", |
| "paws-x/de", |
| "paws-x/es", |
| "paws-x/fr", |
| "miam/vm2", |
| "miam/maptask", |
| "miam/loria", |
| "miam/dihana", |
| "miam/ilisten", |
| "x-stance/fr", |
| "x-stance/de", |
| "offenseval_2020/da", |
| "offenseval_2020/tr", |
| "offenseval_2020/gr", |
| "offenseval_2020/ar", |
| "offenseval_dravidian/tamil", |
| "offenseval_dravidian/malayalam", |
| "offenseval_dravidian/kannada", |
| "xglue/qam", |
| "x-fact", |
| "xglue/nc", |
| "xglue/qadsm", |
| "xglue/qam", |
| "xglue/wpr", |
| "xlwic/xlwic_fr_fr", |
| "xlwic/xlwic_en_ko", |
| "xlwic/xlwic_it_it", |
| "xlwic/xlwic_de_de", |
| "oasst1_dense_flat/quality", |
| "oasst1_dense_flat/toxicity", |
| "oasst1_dense_flat/helpfulness", |
| "language-identification", |
| "wili_2018", |
| "exams/multilingual", |
| "xcsr/X-CSQA-ar", |
| "xcsr/X-CODAH-zh", |
| "xcsr/X-CODAH-de", |
| "xcsr/X-CSQA-ru", |
| "xcsr/X-CODAH-fr", |
| "xcsr/X-CODAH-it", |
| "xcsr/X-CODAH-jap", |
| "xcsr/X-CODAH-nl", |
| "xcsr/X-CODAH-pt", |
| "xcsr/X-CODAH-en", |
| "xcsr/X-CODAH-ru", |
| "xcsr/X-CODAH-ar", |
| "xcsr/X-CODAH-vi", |
| "xcsr/X-CODAH-hi", |
| "xcsr/X-CODAH-sw", |
| "xcsr/X-CODAH-ur", |
| "xcsr/X-CODAH-pl", |
| "xcsr/X-CSQA-ur", |
| "xcsr/X-CODAH-es", |
| "xcsr/X-CSQA-pt", |
| "xcsr/X-CSQA-vi", |
| "xcsr/X-CSQA-hi", |
| "xcsr/X-CSQA-pl", |
| "xcsr/X-CSQA-sw", |
| "xcsr/X-CSQA-nl", |
| "xcsr/X-CSQA-jap", |
| "xcsr/X-CSQA-it", |
| "xcsr/X-CSQA-es", |
| "xcsr/X-CSQA-fr", |
| "xcsr/X-CSQA-zh", |
| "xcsr/X-CSQA-en", |
| "xcsr/X-CSQA-de", |
| "xcopa/qu", |
| "xcopa/it", |
| "xcopa/ht", |
| "xcopa/et", |
| "xcopa/vi", |
| "xcopa/id", |
| "xcopa/translation-et", |
| "xcopa/th", |
| "xcopa/sw", |
| "xcopa/translation-sw", |
| "xcopa/translation-ht", |
| "xcopa/translation-it", |
| "xcopa/ta", |
| "xcopa/translation-zh", |
| "xcopa/translation-vi", |
| "xcopa/translation-id", |
| "xcopa/translation-tr", |
| "xcopa/translation-th", |
| "xcopa/translation-ta", |
| "xcopa/zh", |
| "xcopa/tr", |
| "xstory_cloze/eu", |
| "xstory_cloze/my", |
| "xstory_cloze/te", |
| "xstory_cloze/sw", |
| "xstory_cloze/en", |
| "xstory_cloze/ru", |
| "xstory_cloze/zh", |
| "xstory_cloze/es", |
| "xstory_cloze/ar", |
| "xstory_cloze/hi", |
| "xstory_cloze/id", |
| "xglue/ner", |
| "xglue/pos", |
| "universal_dependencies/sme_giella/pos", |
| "universal_dependencies/no_bokmaal/pos", |
| "universal_dependencies/no_nynorsk/pos", |
| "universal_dependencies/no_nynorsklia/pos", |
| "universal_dependencies/cu_proiel/pos", |
| "universal_dependencies/fro_srcmf/pos", |
| "universal_dependencies/orv_rnc/pos", |
| "universal_dependencies/pl_lfg/pos", |
| "universal_dependencies/otk_tonqq/pos", |
| "universal_dependencies/fa_perdt/pos", |
| "universal_dependencies/fa_seraji/pos", |
| "universal_dependencies/pcm_nsc/pos", |
| "universal_dependencies/pl_pdb/pos", |
| "universal_dependencies/pl_pud/pos", |
| "universal_dependencies/pt_bosque/pos", |
| "universal_dependencies/pt_gsd/pos", |
| "universal_dependencies/pt_pud/pos", |
| "universal_dependencies/orv_torot/pos", |
| "universal_dependencies/myu_tudet/pos", |
| "universal_dependencies/gv_cadhan/pos", |
| "universal_dependencies/gun_thomas/pos", |
| "universal_dependencies/koi_uh/pos", |
| "universal_dependencies/kpv_ikdp/pos", |
| "universal_dependencies/kpv_lattice/pos", |
| "universal_dependencies/ko_gsd/pos", |
| "universal_dependencies/ko_kaist/pos", |
| "universal_dependencies/ko_pud/pos", |
| "universal_dependencies/kmr_mg/pos", |
| "universal_dependencies/la_ittb/pos", |
| "universal_dependencies/la_llct/pos", |
| "universal_dependencies/la_perseus/pos", |
| "universal_dependencies/la_proiel/pos", |
| "universal_dependencies/lv_lvtb/pos", |
| "universal_dependencies/lt_alksnis/pos", |
| "universal_dependencies/lt_hse/pos", |
| "universal_dependencies/olo_kkpp/pos", |
| "universal_dependencies/mt_mudt/pos", |
| "universal_dependencies/ro_nonstandard/pos", |
| "universal_dependencies/mr_ufal/pos", |
| "universal_dependencies/gun_dooley/pos", |
| "universal_dependencies/mdf_jr/pos", |
| "universal_dependencies/ro_rrt/pos", |
| "universal_dependencies/ru_taiga/pos", |
| "universal_dependencies/ru_gsd/pos", |
| "universal_dependencies/ta_mwtt/pos", |
| "universal_dependencies/ta_ttb/pos", |
| "universal_dependencies/te_mtg/pos", |
| "universal_dependencies/th_pud/pos", |
| "universal_dependencies/qtd_sagt/pos", |
| "universal_dependencies/tr_boun/pos", |
| "universal_dependencies/tr_gb/pos", |
| "universal_dependencies/tr_imst/pos", |
| "universal_dependencies/tr_pud/pos", |
| "universal_dependencies/uk_iu/pos", |
| "universal_dependencies/hsb_ufal/pos", |
| "universal_dependencies/ur_udtb/pos", |
| "universal_dependencies/ug_udt/pos", |
| "universal_dependencies/vi_vtb/pos", |
| "universal_dependencies/wbp_ufal/pos", |
| "universal_dependencies/cy_ccg/pos", |
| "universal_dependencies/wo_wtb/pos", |
| "universal_dependencies/yo_ytb/pos", |
| "universal_dependencies/tl_ugnayan/pos", |
| "universal_dependencies/ro_simonero/pos", |
| "universal_dependencies/tl_trg/pos", |
| "universal_dependencies/sv_talbanken/pos", |
| "universal_dependencies/ru_pud/pos", |
| "universal_dependencies/ru_syntagrus/pos", |
| "universal_dependencies/sa_ufal/pos", |
| "universal_dependencies/sa_vedic/pos", |
| "universal_dependencies/gd_arcosg/pos", |
| "universal_dependencies/sr_set/pos", |
| "universal_dependencies/sms_giellagas/pos", |
| "universal_dependencies/sk_snk/pos", |
| "universal_dependencies/sl_ssj/pos", |
| "universal_dependencies/sl_sst/pos", |
| "universal_dependencies/ajp_madar/pos", |
| "universal_dependencies/es_ancora/pos", |
| "universal_dependencies/es_gsd/pos", |
| "universal_dependencies/es_pud/pos", |
| "universal_dependencies/swl_sslc/pos", |
| "universal_dependencies/sv_lines/pos", |
| "universal_dependencies/sv_pud/pos", |
| "universal_dependencies/gsw_uzh/pos", |
| "universal_dependencies/kk_ktb/pos", |
| "universal_dependencies/hi_hdtb/pos", |
| "universal_dependencies/ja_pud/pos", |
| "universal_dependencies/zh_gsd/pos", |
| "universal_dependencies/zh_gsdsimp/pos", |
| "universal_dependencies/zh_hk/pos", |
| "universal_dependencies/zh_pud/pos", |
| "universal_dependencies/ckt_hse/pos", |
| "universal_dependencies/lzh_kyoto/pos", |
| "universal_dependencies/cop_scriptorium/pos", |
| "universal_dependencies/hr_set/pos", |
| "universal_dependencies/cs_cac/pos", |
| "universal_dependencies/cs_cltt/pos", |
| "universal_dependencies/cs_fictree/pos", |
| "universal_dependencies/cs_pdt/pos", |
| "universal_dependencies/cs_pud/pos", |
| "universal_dependencies/da_ddt/pos", |
| "universal_dependencies/nl_alpino/pos", |
| "universal_dependencies/nl_lassysmall/pos", |
| "universal_dependencies/en_esl/pos", |
| "universal_dependencies/en_ewt/pos", |
| "universal_dependencies/en_gum/pos", |
| "universal_dependencies/zh_cfl/pos", |
| "universal_dependencies/ca_ancora/pos", |
| "universal_dependencies/yue_hk/pos", |
| "universal_dependencies/bxr_bdt/pos", |
| "universal_dependencies/af_afribooms/pos", |
| "universal_dependencies/krl_kkpp/pos", |
| "universal_dependencies/akk_riao/pos", |
| "universal_dependencies/aqz_tudet/pos", |
| "universal_dependencies/sq_tsa/pos", |
| "universal_dependencies/am_att/pos", |
| "universal_dependencies/grc_perseus/pos", |
| "universal_dependencies/grc_proiel/pos", |
| "universal_dependencies/apu_ufpa/pos", |
| "universal_dependencies/en_gumreddit/pos", |
| "universal_dependencies/ar_nyuad/pos", |
| "universal_dependencies/ar_pud/pos", |
| "universal_dependencies/hy_armtdp/pos", |
| "universal_dependencies/aii_as/pos", |
| "universal_dependencies/bm_crb/pos", |
| "universal_dependencies/eu_bdt/pos", |
| "universal_dependencies/be_hse/pos", |
| "universal_dependencies/bho_bhtb/pos", |
| "universal_dependencies/br_keb/pos", |
| "universal_dependencies/bg_btb/pos", |
| "universal_dependencies/ar_padt/pos", |
| "universal_dependencies/en_lines/pos", |
| "universal_dependencies/akk_pisandub/pos", |
| "universal_dependencies/en_pronouns/pos", |
| "universal_dependencies/el_gdt/pos", |
| "universal_dependencies/he_htb/pos", |
| "universal_dependencies/qhe_hiencs/pos", |
| "universal_dependencies/hi_pud/pos", |
| "universal_dependencies/hu_szeged/pos", |
| "universal_dependencies/is_icepahc/pos", |
| "universal_dependencies/id_csui/pos", |
| "universal_dependencies/id_gsd/pos", |
| "universal_dependencies/id_pud/pos", |
| "universal_dependencies/ga_idt/pos", |
| "universal_dependencies/it_isdt/pos", |
| "universal_dependencies/it_partut/pos", |
| "universal_dependencies/it_postwita/pos", |
| "universal_dependencies/it_pud/pos", |
| "universal_dependencies/it_twittiro/pos", |
| "universal_dependencies/it_vit/pos", |
| "universal_dependencies/ja_bccwj/pos", |
| "universal_dependencies/ja_gsd/pos", |
| "universal_dependencies/ja_modern/pos", |
| "universal_dependencies/got_proiel/pos", |
| "universal_dependencies/de_pud/pos", |
| "universal_dependencies/is_pud/pos", |
| "universal_dependencies/de_hdt/pos", |
| "universal_dependencies/en_pud/pos", |
| "universal_dependencies/myv_jr/pos", |
| "universal_dependencies/de_lit/pos", |
| "universal_dependencies/et_ewt/pos", |
| "universal_dependencies/fo_farpahc/pos", |
| "universal_dependencies/fo_oft/pos", |
| "universal_dependencies/fi_ftb/pos", |
| "universal_dependencies/fi_ood/pos", |
| "universal_dependencies/fi_pud/pos", |
| "universal_dependencies/fi_tdt/pos", |
| "universal_dependencies/et_edt/pos", |
| "universal_dependencies/fr_ftb/pos", |
| "universal_dependencies/fr_fqb/pos", |
| "universal_dependencies/de_gsd/pos", |
| "universal_dependencies/gl_treegal/pos", |
| "universal_dependencies/gl_ctg/pos", |
| "universal_dependencies/fr_spoken/pos", |
| "universal_dependencies/en_partut/pos", |
| "universal_dependencies/fr_pud/pos", |
| "universal_dependencies/fr_partut/pos", |
| "universal_dependencies/fr_sequoia/pos", |
| "universal_dependencies/fr_gsd/pos", |
| "oasst1_pairwise_rlhf_reward", |
| "multilingual-sentiments/all", |
| "tweet_sentiment_multilingual/arabic", |
| "tweet_sentiment_multilingual/french", |
| "tweet_sentiment_multilingual/english", |
| "tweet_sentiment_multilingual/hindi", |
| "tweet_sentiment_multilingual/portuguese", |
| "tweet_sentiment_multilingual/spanish", |
| "tweet_sentiment_multilingual/all", |
| "tweet_sentiment_multilingual/german", |
| "tweet_sentiment_multilingual/italian", |
| "amazon_reviews_multi/all_languages", |
| "universal-joy", |
| "mms", |
| "ACES", |
| "massive/my-MM", |
| "massive/ro-RO", |
| "massive/pt-PT", |
| "massive/pl-PL", |
| "massive/nl-NL", |
| "massive/nb-NO", |
| "massive/es-ES", |
| "massive/ms-MY", |
| "massive/mn-MN", |
| "massive/ml-IN", |
| "massive/lv-LV", |
| "massive/ko-KR", |
| "massive/ru-RU", |
| "massive/kn-IN", |
| "massive/ka-GE", |
| "massive/jv-ID", |
| "massive/ja-JP", |
| "massive/it-IT", |
| "massive/is-IS", |
| "massive/id-ID", |
| "massive/hy-AM", |
| "massive/hu-HU", |
| "massive/hi-IN", |
| "massive/he-IL", |
| "massive/fr-FR", |
| "massive/km-KH", |
| "massive/fi-FI", |
| "massive/sl-SL", |
| "massive/sv-SE", |
| "massive/af-ZA", |
| "massive/am-ET", |
| "massive/ar-SA", |
| "massive/az-AZ", |
| "massive/bn-BD", |
| "massive/ca-ES", |
| "massive/cy-GB", |
| "massive/da-DK", |
| "massive/de-DE", |
| "massive/el-GR", |
| "massive/sq-AL", |
| "massive/en-US", |
| "massive/all", |
| "massive/zh-TW", |
| "massive/zh-CN", |
| "massive/vi-VN", |
| "massive/ur-PK", |
| "massive/tr-TR", |
| "massive/tl-PH", |
| "massive/th-TH", |
| "massive/te-IN", |
| "massive/ta-IN", |
| "massive/sw-KE", |
| "massive/all_1.1", |
| "massive/fa-IR", |
| "tydi-as2-balanced", |
| "multiconer_v2/Hindi (HI)", |
| "multiconer_v2/Multilingual (MULTI)", |
| "multiconer_v2/Ukrainian (UK)", |
| "multiconer_v2/Swedish (SV)", |
| "multiconer_v2/Spanish (ES)", |
| "multiconer_v2/Bangla (BN)", |
| "multiconer_v2/Chinese (ZH)", |
| "multiconer_v2/English (EN)", |
| "multiconer_v2/Farsi (FA)", |
| "multiconer_v2/Portuguese (PT)", |
| "multiconer_v2/German (DE)", |
| "multiconer_v2/Italian (IT)", |
| "multiconer_v2/French (FR)", |
| "mtop", |
| "multilingual-zero-shot-label-nli" |
| ], |
| "torch_dtype": "float32", |
| "transformers_version": "4.31.0", |
| "type_vocab_size": 0, |
| "vocab_size": 251000 |
| } |
|
|