# Sweep configuration: grid search over `chunk_length_s` for the program
# `run_long_form_transcription.py`, minimizing the metric
# `tedlium-long-form/validation/wer`. Every other parameter is pinned to a
# single value, so `chunk_length_s` is the only dimension that varies.

# Command line used to launch each run. `${program}` and `${args}` are
# placeholders filled in by the sweep runner (presumably with the `program`
# entry below and the per-run parameter flags -- confirm against the sweep
# tool's documentation). `--streaming` is passed verbatim to every run.
command:
  - python3
  - ${program}
  - --streaming
  - ${args}

# Search strategy.
method: grid

# Objective reported by the runs; lower is better.
metric:
  goal: minimize
  name: tedlium-long-form/validation/wer

parameters:
  # Model checkpoint under evaluation.
  model_name_or_path:
    value: sanchit-gandhi/large-32-2-ts-freeze-28k-wer-10
  subfolder:
    value: checkpoint-15000

  # Evaluation dataset.
  dataset_name:
    value: distil-whisper/tedlium-long-form
  dataset_config_name:
    value: all
  dataset_split_name:
    value: validation

  # Cache / output locations.
  # NOTE(review): these are absolute paths into one user's home directory;
  # adjust them before running the sweep on another machine or account.
  cache_dir:
    value: /home/sanchitgandhi/.cache
  dataset_cache_dir:
    value: /home/sanchitgandhi/.cache
  compilation_cache:
    value: /home/sanchitgandhi/.cache
  output_dir:
    value: ./
  wandb_dir:
    value: /home/sanchitgandhi/.cache

  # Fixed evaluation settings.
  per_device_eval_batch_size:
    value: 8
  dtype:
    value: bfloat16
  report_to:
    value: wandb

  # The swept parameter: one run per listed value.
  # NOTE(review): the `_s` suffix suggests the unit is seconds -- confirm in
  # run_long_form_transcription.py.
  chunk_length_s:
    values:
      - 10
      - 15
      - 20
      - 25
      - 30

  generation_max_length:
    value: 128

# Script substituted for `${program}` and the project the runs are logged to.
program: run_long_form_transcription.py
project: distil-whisper-long-form