# Run eval.py for the model w11wo/wav2vec2-xls-r-300m-zh-HK-lm-v2 on the
# "validation" split of the "zh-HK" config of
# speech-recognition-community-v2/dev_data, reading reference text from the
# "sentence" column.
#
# NOTE(review): the flag meanings below are inferred from their names, since
# eval.py is not visible here — confirm against its argument parser:
#   --chunk_length_s / --stride_length_s  presumably chunk and stride lengths
#                                         in seconds
#   --log_outputs                         presumably writes outputs to a log
#   --device                              presumably the accelerator index
#
# Each backslash must be the LAST character on its line (no trailing spaces
# or other characters); otherwise the shell does not treat it as a line
# continuation and the command is split apart.
python eval.py \
  --model_id="w11wo/wav2vec2-xls-r-300m-zh-HK-lm-v2" \
  --dataset="speech-recognition-community-v2/dev_data" \
  --config="zh-HK" \
  --split="validation" \
  --text_column_name="sentence" \
  --chunk_length_s="10" \
  --stride_length_s="2" \
  --log_outputs \
  --device="0"