; Configuration with three sections: input, model and decode.
; One section header per line and one key=value pair per line, so that
; line-oriented INI parsers assign every key to its intended section.

; Properties of the input data.
[input]
modality=video
; NOTE(review): v_fps is 30 here but 25 under [model]; presumably the
; source video frame rate versus the rate the model expects -- confirm.
v_fps=30

; Model and language-model files. The paths are relative; the base
; directory they resolve against is not visible here -- confirm.
[model]
v_fps=25
model_path=benchmarks/CMUMOSEAS/models/pt/CMUMOSEAS_V_PT_WER51.4/model.pth
model_conf=benchmarks/CMUMOSEAS/models/pt/CMUMOSEAS_V_PT_WER51.4/model.json
rnnlm=benchmarks/CMUMOSEAS/language_models/pt/lm_pt/model.pth
rnnlm_conf=benchmarks/CMUMOSEAS/language_models/pt/lm_pt/model.json

; Decoding parameters.
; NOTE(review): ctc_weight and lm_weight presumably weight the CTC and
; language-model scores during beam search -- confirm against the decoder.
[decode]
beam_size=30
penalty=0.0
maxlenratio=0.0
minlenratio=0.0
ctc_weight=0.1
lm_weight=0.3