# Pinned Python dependencies, one requirement specifier per line
# (pip requirements-file format). Versions are exact (==) pins.
decord==0.6.0
fairseq==0.12.2
# Installed with the "multi-modal" extra.
modelscope[multi-modal]==1.3.2