romman8's picture
add: training_parameter.json for reproducability
14a044f
{
"ppo_config": {
"model_name": "R-best-fine-tuned-bart-base-full-ft-reward_short_sentences_and_words-2023-07-13T06-49-08",
"steps": 20000,
"note": "Stopped manually after 65 steps",
"learning_rate": 1e-06,
"target": 6,
"batch_size": 64,
"mini_batch_size": 1,
"ppo_epochs": 4,
"gradient_accumulation_steps": 1,
"log_with": "tensorboard",
"accelerator_kwargs": {
"logging_dir": "/content/results/R-best-fine-tuned-bart-base-full-ft-reward_short_sentences_and_words-2023-07-13T06-49-08/runs"
},
"early_stopping": false,
"push_to_hub_if_best_kwargs": {
"repo_id": "nlp-lab-2023-seq2seq/R-best-fine-tuned-bart-base-full-ft-reward_short_sentences_and_words-2023-07-13T06-49-08",
"private": true,
"commit_message": "add: new best model"
},
"compare_steps": 100
},
"generation_kwargs": {
"max_new_tokens": 414,
"num_beams": 1,
"early_stopping": true,
"pad_token_id": 1,
"eos_token_id": 2
},
"translation_model": "nlp-lab-2023-seq2seq/R-facebook-bart-base-full-ft-without-tum-nlp-german-gpt2_easy-prior-pp-bb5c579f",
"reward_fn": "reward_bleu_short_sentences_and_words",
"finetuning_strategy": "full"
}