# Hyperparameter sweep configuration (Weights & Biases sweep format) for
# fine-tuning a speech-translation model on CoVoST 2 (fr -> en) with
# run_xtreme_s.py.
#
# The grid has a single swept parameter (learning_rate, two values), so the
# sweep consists of two runs. Every other parameter is pinned to one value.
---
# Command line used to launch each run. ${program} is replaced by the
# `program` key below and ${args} by the `parameters` of the current run.
command:
  - python3
  - ${program}
  - --overwrite_output_dir
  - --freeze_feature_encoder
  - --gradient_checkpointing
  - --predict_with_generate
  - --fp16
  - --group_by_length
  - --do_train
  - --do_eval
  - --load_best_model_at_end
  - --push_to_hub
  - --use_auth_token
  - ${args}

# Exhaustively try every combination of the listed parameter values.
method: grid

# Metric used to rank the runs of the sweep.
metric:
  goal: maximize
  name: eval/bleu

parameters:
  # Model and data selection.
  model_name_or_path:
    value: ./
  task:
    value: covost2
  language:
    value: fr.en
  eval_split_name:
    value: test
  output_dir:
    value: ./

  # Training schedule. With a per-device batch of 8 and 16 accumulation
  # steps, each optimizer step sees 8 * 16 = 128 examples per device.
  num_train_epochs:
    value: 3
  per_device_train_batch_size:
    value: 8
  per_device_eval_batch_size:
    value: 8
  gradient_accumulation_steps:
    value: 16

  # Generation settings used during evaluation.
  generation_max_length:
    value: 40
  generation_num_beams:
    value: 1

  # The only swept parameter. Written with an explicit decimal point so that
  # YAML 1.1 parsers (e.g. PyYAML) resolve the values as floats, not strings.
  learning_rate:
    values:
      - 3.0e-5
      - 3.0e-4
  hidden_dropout:
    value: 0.2
  warmup_steps:
    value: 500

  # Evaluation, checkpointing and logging cadence. save_steps and eval_steps
  # are kept equal; NOTE(review): presumably required by
  # --load_best_model_at_end - confirm against the training script.
  evaluation_strategy:
    value: steps
  max_duration_in_seconds:
    value: 20
  save_steps:
    value: 500
  eval_steps:
    value: 500
  logging_steps:
    value: 1

  # Best-checkpoint selection: higher BLEU is better.
  metric_for_best_model:
    value: bleu
  greater_is_better:
    value: true

# Training script substituted for ${program} in `command`.
program: run_xtreme_s.py

# Project under which the sweep's runs are grouped.
project: xtreme_s_xlsr_2_bart_covost2_fr_en