wandb_version: 1 | |
eval_split_name: | |
value: test | |
eval_steps: | |
value: 500 | |
evaluation_strategy: | |
value: steps | |
generation_max_length: | |
value: 40 | |
generation_num_beams: | |
value: 1 | |
gradient_accumulation_steps: | |
value: 8 | |
greater_is_better: | |
value: true | |
hidden_dropout: | |
value: 0.18004101365999406 | |
language: | |
value: fr.en | |
learning_rate: | |
value: 0.0002757119755681108 | |
logging_steps: | |
value: 1 | |
max_duration_in_seconds: | |
value: 20 | |
metric_for_best_model: | |
value: bleu | |
model_name_or_path: | |
value: ./ | |
num_train_epochs: | |
value: 3 | |
output_dir: | |
value: ./ | |
per_device_eval_batch_size: | |
value: 8 | |
per_device_train_batch_size: | |
value: 8 | |
save_steps: | |
value: 500 | |
task: | |
value: covost2 | |
warmup_steps: | |
value: 500 | |