# Run eval.py with the w11wo/wav2vec2-xls-r-300m-zh-HK-v2 model on the
# "zh-HK" config, "validation" split of speech-recognition-community-v2/dev_data,
# reading reference text from the "sentence" column.
#
# Each trailing backslash must be the very last character on its line. A
# backslash followed by a space escapes that space instead of continuing the
# line, which hands every option to eval.py with a leading blank so that it is
# no longer recognized as an option.
#
# NOTE(review): --device="0" presumably selects the first GPU, and the
# chunk/stride values are presumably in seconds -- confirm against eval.py.
python eval.py \
  --model_id="w11wo/wav2vec2-xls-r-300m-zh-HK-v2" \
  --dataset="speech-recognition-community-v2/dev_data" \
  --config="zh-HK" \
  --split="validation" \
  --text_column_name="sentence" \
  --chunk_length_s="10" \
  --stride_length_s="2" \
  --log_outputs \
  --device="0"