{
  "exp_name":"mt_enfrde",
  "exp_id":"demo",
  "dump_path":"/content/dump_path",
  "encoder_only":"False",
  "data_path":"/content/processed",
  "lgs":"de-en-fr",
  "clm_steps":"",
  "mlm_steps":"",
  "mt_steps":"...",
  "ae_steps":"",
  "bt_steps":"",
  "pc_steps":"",
  "reload_emb":"",
  "reload_model":"/content/dump_path/mlm_enfrde/demo/best-valid_mlm_ppl.pth,/content/dump_path/mlm_enfrde/demo/best-valid_mlm_ppl.pth",
  "reload_checkpoint":"",
  "epoch_size":"100",
  "max_epoch":"1",
  "stopping_criterion":"valid_en-fr_mt_bleu,10",
  "validation_metrics":"valid_en-fr_mt_bleu",
  "train_n_samples":"-1",
  "valid_n_samples":"-1",
  "test_n_samples":"-1",
  "remove_long_sentences_train":"False",
  "remove_long_sentences_valid":"False",
  "remove_long_sentences_test":"False",

  "eval_bleu":"True",
  "eval_only":"False",
  "max_len":"100",
  "group_by_size":"True",
  "batch_size":"32",
  "save_periodic":"0",
  "fp16":"False",
  "amp":"-1",
  "emb_dim":"1024",
  "n_layers":"6",
  "n_heads":"8",
  "dropout":"0.1",
  "attention_dropout":"0.1",
  "gelu_activation":"True",
  "share_inout_emb":"True",
  "sinusoidal_embeddings":"False",
  "use_lang_emb":"True",
  "use_memory":"False",
  "asm":"False",
  "context_size":"0",
  "word_pred":"0.15",
  "word_mask_keep_rand":"0.8,0.1,0.1",
  "word_shuffle":"3",
  "word_dropout":"0.1",
  "word_blank":"0.1",
  "max_vocab":"-1",
  "min_count":"0",
  "lg_sampling_factor":"-1",
  "bptt":"256",
  "max_batch_size":"0",
  "tokens_per_batch":"2000",
  "split_data":"False",
  "optimizer":"adam_inverse_sqrt,beta1=0.9,beta2=0.98,lr=0.0001",
  "clip_grad_norm":"5",
  "accumulate_gradients":"1",
  "lambda_mlm":"1",
  "lambda_clm":"1",
  "lambda_pc":"1",
  "lambda_ae":"0:1,100000:0.1,300000:0",
  "lambda_mt":"1",
  "lambda_bt":"1",
  "beam_size":"1",
  "length_penalty":"1",
  "early_stopping":"False",
  "debug_train":"False",
  "debug_slurm":"False",
  "local_rank":"-1",
  "master_port":"-1",
  "mem_enc_positions":"",
  "mem_dec_positions":"",
  "asm_cutoffs":"8000,20000",
  "asm_div_value":"4"
}