# Launch run_audio_classification.py through the DeepSpeed launcher, using
# ds_config.json as the DeepSpeed configuration file.
#
#   Model:   openai/whisper-medium
#   Dataset: google/xtreme_s, config fleurs.all, label column lang_id
#   Output:  the current directory (--output_dir ./ with
#            --overwrite_output_dir); --push_to_hub is also set.
#
# NOTE: each trailing backslash must be the LAST character on its line.
# A backslash followed by a space escapes that space instead of continuing
# the line, so the following option would be passed as " --option" (with a
# leading space) rather than as "--option".
deepspeed run_audio_classification.py \
  --deepspeed ds_config.json \
  --model_name_or_path openai/whisper-medium \
  --dataset_name google/xtreme_s \
  --dataset_config_name fleurs.all \
  --output_dir ./ \
  --overwrite_output_dir \
  --remove_unused_columns False \
  --do_train \
  --do_eval \
  --fp16 \
  --learning_rate 3e-5 \
  --max_length_seconds 30 \
  --label_column_name lang_id \
  --attention_mask False \
  --warmup_ratio 0.1 \
  --num_train_epochs 3 \
  --per_device_train_batch_size 16 \
  --gradient_accumulation_steps 2 \
  --gradient_checkpointing True \
  --per_device_eval_batch_size 32 \
  --dataloader_num_workers 8 \
  --logging_strategy steps \
  --logging_steps 25 \
  --evaluation_strategy epoch \
  --save_strategy epoch \
  --load_best_model_at_end True \
  --metric_for_best_model accuracy \
  --seed 0 \
  --freeze_feature_encoder False \
  --push_to_hub