| { |
| "_name_or_path": "Python/ACROSS-m2o-eng-small", |
| "architectures": [ |
| "MT5ForConditionalGeneration" |
| ], |
| "consistency_loss_weight": 2.0, |
| "consistency_temperature": 1.0, |
| "contrastive": true, |
| "contrastive_mini_batch_size": 4, |
| "cross_alignment_loss_weight": 1.0, |
| "d_ff": 1024, |
| "d_kv": 64, |
| "d_model": 512, |
| "decoder_start_token_id": 0, |
| "dropout_rate": 0.1, |
| "eos_token_id": 1, |
| "feature_pooling_method": "mean_pooling", |
| "feed_forward_proj": "gated-gelu", |
| "freeze_decoder": false, |
| "freeze_mono_encoder": true, |
| "initializer_factor": 1.0, |
| "is_encoder_decoder": true, |
| "layer_norm_epsilon": 1e-06, |
| "length_penalty": 0.6, |
| "max_length": 84, |
| "model_type": "mt5", |
| "num_beams": 4, |
| "num_decoder_layers": 8, |
| "num_heads": 6, |
| "num_layers": 8, |
| "pad_token_id": 0, |
| "queue_size": 8192, |
| "relative_attention_num_buckets": 32, |
| "similarity_method": "cosine", |
| "t5_path_or_url": "output/eng2eng_small_baseline_A5000", |
| "task_specific_params": { |
| "langid_map": { |
| "amharic": [ |
| 39, |
| "\u2581<extra_id_64>" |
| ], |
| "arabic": [ |
| 8, |
| "\u2581<extra_id_95>" |
| ], |
| "azerbaijani": [ |
| 11, |
| "\u2581<extra_id_92>" |
| ], |
| "bengali": [ |
| 46, |
| "\u2581<extra_id_57>" |
| ], |
| "burmese": [ |
| 37, |
| "\u2581<extra_id_66>" |
| ], |
| "chinese_simplified": [ |
| 44, |
| "\u2581<extra_id_59>" |
| ], |
| "chinese_traditional": [ |
| 48, |
| "\u2581<extra_id_55>" |
| ], |
| "czech": [ |
| 3, |
| "\u2581<extra_id_54>" |
| ], |
| "dutch": [ |
| 1, |
| "\u2581<extra_id_52>" |
| ], |
| "english": [ |
| 34, |
| "\u2581<extra_id_69>" |
| ], |
| "french": [ |
| 14, |
| "\u2581<extra_id_89>" |
| ], |
| "german": [ |
| 0, |
| "\u2581<extra_id_51>" |
| ], |
| "gujarati": [ |
| 31, |
| "\u2581<extra_id_72>" |
| ], |
| "hausa": [ |
| 47, |
| "\u2581<extra_id_56>" |
| ], |
| "hindi": [ |
| 25, |
| "\u2581<extra_id_78>" |
| ], |
| "igbo": [ |
| 13, |
| "\u2581<extra_id_90>" |
| ], |
| "indonesian": [ |
| 5, |
| "\u2581<extra_id_98>" |
| ], |
| "italian": [ |
| 2, |
| "\u2581<extra_id_53>" |
| ], |
| "japanese": [ |
| 41, |
| "\u2581<extra_id_62>" |
| ], |
| "kirundi": [ |
| 4, |
| "\u2581<extra_id_99>" |
| ], |
| "korean": [ |
| 33, |
| "\u2581<extra_id_70>" |
| ], |
| "kyrgyz": [ |
| 9, |
| "\u2581<extra_id_94>" |
| ], |
| "marathi": [ |
| 17, |
| "\u2581<extra_id_86>" |
| ], |
| "nepali": [ |
| 24, |
| "\u2581<extra_id_79>" |
| ], |
| "oromo": [ |
| 45, |
| "\u2581<extra_id_58>" |
| ], |
| "pashto": [ |
| 38, |
| "\u2581<extra_id_65>" |
| ], |
| "persian": [ |
| 27, |
| "\u2581<extra_id_76>" |
| ], |
| "pidgin": [ |
| 18, |
| "\u2581<extra_id_85>" |
| ], |
| "portuguese": [ |
| 43, |
| "\u2581<extra_id_60>" |
| ], |
| "punjabi": [ |
| 21, |
| "\u2581<extra_id_82>" |
| ], |
| "russian": [ |
| 40, |
| "\u2581<extra_id_63>" |
| ], |
| "scottish_gaelic": [ |
| 28, |
| "\u2581<extra_id_75>" |
| ], |
| "serbian_cyrillic": [ |
| 32, |
| "\u2581<extra_id_71>" |
| ], |
| "serbian_latin": [ |
| 15, |
| "\u2581<extra_id_88>" |
| ], |
| "sinhala": [ |
| 35, |
| "\u2581<extra_id_68>" |
| ], |
| "somali": [ |
| 23, |
| "\u2581<extra_id_80>" |
| ], |
| "spanish": [ |
| 7, |
| "\u2581<extra_id_96>" |
| ], |
| "swahili": [ |
| 22, |
| "\u2581<extra_id_81>" |
| ], |
| "tamil": [ |
| 36, |
| "\u2581<extra_id_67>" |
| ], |
| "telugu": [ |
| 26, |
| "\u2581<extra_id_77>" |
| ], |
| "thai": [ |
| 10, |
| "\u2581<extra_id_93>" |
| ], |
| "tigrinya": [ |
| 20, |
| "\u2581<extra_id_83>" |
| ], |
| "turkish": [ |
| 19, |
| "\u2581<extra_id_84>" |
| ], |
| "ukrainian": [ |
| 6, |
| "\u2581<extra_id_97>" |
| ], |
| "urdu": [ |
| 42, |
| "\u2581<extra_id_61>" |
| ], |
| "uzbek": [ |
| 12, |
| "\u2581<extra_id_91>" |
| ], |
| "vietnamese": [ |
| 16, |
| "\u2581<extra_id_87>" |
| ], |
| "welsh": [ |
| 30, |
| "\u2581<extra_id_73>" |
| ], |
| "yoruba": [ |
| 29, |
| "\u2581<extra_id_74>" |
| ] |
| } |
| }, |
| "temperature": 0.1, |
| "tie_word_embeddings": false, |
| "tokenizer_class": "T5Tokenizer", |
| "use_cache": true, |
| "use_consistency_loss": true, |
| "use_cross_alignment_loss": true, |
| "use_queue_for_contrastive": true, |
| "vocab_size": 250112 |
| } |
|
|