timm==0.4.12
transformers==4.15.0
fairscale==0.4.4
tokenizers==0.10.1
pycocoevalcap
torch==1.13.1
torchvision==0.14.1
Pillow