{
  "adapter_layer_norm": false,
  "adapter_reduction_factor": 2,
  "adapter_reuse_layer_norm": true,
  "architectures": [
    "XmodForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "languages": [
    "en_XX",
    "id_ID",
    "vi_VN",
    "ru_RU",
    "fa_IR",
    "sv_SE",
    "ja_XX",
    "fr_XX",
    "de_DE",
    "ro_RO",
    "ko_KR",
    "hu_HU",
    "es_XX",
    "fi_FI",
    "uk_UA",
    "da_DK",
    "pt_XX",
    "no_XX",
    "th_TH",
    "pl_PL",
    "bg_BG",
    "nl_XX",
    "zh_CN",
    "he_IL",
    "el_GR",
    "it_IT",
    "sk_SK",
    "hr_HR",
    "tr_TR",
    "ar_AR",
    "cs_CZ",
    "lt_LT",
    "hi_IN",
    "zh_TW",
    "ca_ES",
    "ms_MY",
    "sl_SI",
    "lv_LV",
    "ta_IN",
    "bn_IN",
    "et_EE",
    "az_AZ",
    "sq_AL",
    "sr_RS",
    "kk_KZ",
    "ka_GE",
    "tl_XX",
    "ur_PK",
    "is_IS",
    "hy_AM",
    "ml_IN",
    "mk_MK",
    "be_BY",
    "la_VA",
    "te_IN",
    "eu_ES",
    "gl_ES",
    "mn_MN",
    "kn_IN",
    "ne_NP",
    "sw_KE",
    "si_LK",
    "mr_IN",
    "af_ZA",
    "gu_IN",
    "cy_GB",
    "eo_EO",
    "km_KH",
    "ky_KG",
    "uz_UZ",
    "ps_AF",
    "pa_IN",
    "ga_IE",
    "ha_NG",
    "am_ET",
    "lo_LA",
    "ku_TR",
    "so_SO",
    "my_MM",
    "or_IN",
    "sa_IN"
  ],
  "layer_norm_eps": 1e-05,
  "ln_before_adapter": true,
  "max_position_embeddings": 514,
  "model_type": "xmod",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "pre_norm": false,
  "torch_dtype": "float32",
  "transformers_version": "4.26.0.dev0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 250002
}