timm==0.4.12
fairscale==0.4.4
pycocoevalcap
torch
torchvision
Pillow
transformers[sentencepiece]