"""Streamlit demo that estimates crowd counts with the M-SFANet model.

The script clones the reference model repository, obtains the pretrained
UCF-QNRF checkpoint, and shows a density map plus an estimated count for an
uploaded image.
"""
import os
import subprocess
import sys
import zipfile

import cv2
import gdown
from PIL import Image
import numpy as np
import streamlit as st
import torch
from torchvision import transforms

# NOTE(review): both URLs were missing from the copy of this file under review
# and were restored from the repository name and paper title that remain in
# the code -- confirm them before deploying.
_REPO_BASE_URL = 'https://github.com/Pongpisit-Thanasutives'
_PAPER_URL = 'https://arxiv.org/abs/2003.05586'

# Both image sides are snapped to a multiple of this value before inference
# (presumably required by the network's down/up-sampling stages -- TODO
# confirm against the model definition).
_SIZE_MULTIPLE = 16


def setup_env(path: str = 'Variations-of-SFANet-for-Crowd-Counting') -> str:
    """Clone the model repository if needed and make it importable.

    Args:
        path: Repository name. It is used both as the local checkout
            directory and as the last component of the clone URL.

    Returns:
        The ``path`` argument, unchanged.

    Raises:
        subprocess.CalledProcessError: If ``git clone`` exits with an error.
    """
    if not os.path.exists(path):
        subprocess.run(
            [
                'git',
                'clone',
                f'{_REPO_BASE_URL}/{path}.git',
                f'{path}',
            ],
            capture_output=True,
            check=True,
        )
        # Write an empty models/__init__.py so that ``models`` is importable
        # as a regular package with no import-time side effects.
        with open(os.path.join(path, 'models', '__init__.py'), 'w') as f:
            f.write('')

    # Register the checkout even when it already existed on disk; otherwise a
    # fresh process that finds the clone in place cannot import ``models``.
    if path not in sys.path:
        sys.path.append(path)
    return path


def get_model(path: str, weights: str):
    """Build the M-SFANet (UCF-QNRF) model and load its weights on the CPU.

    Args:
        path: Directory of the cloned model repository; it is added to
            ``sys.path`` if not already present.
        weights: Path to the ``.pth`` state-dict file.

    Returns:
        The model in evaluation mode.
    """
    if path and path not in sys.path:
        sys.path.append(path)

    # Imported lazily: the package only exists once the repository is cloned.
    from models import M_SFANet_UCF_QNRF

    model = M_SFANet_UCF_QNRF.Model()
    # NOTE(review): torch.load unpickles the checkpoint, so only load files
    # obtained from a trusted source.
    state = torch.load(weights, map_location=torch.device('cpu'))
    model.load_state_dict(state)
    return model.eval()


def download_weights(
    url: str = '',
    out: str = "Paper's_weights_UCF_QNRF.zip",
) -> str:
    """Return the path to the pretrained weights, downloading them if absent.

    NOTE(review): the default ``url`` is empty and the default ``out`` was
    truncated in the copy of the file under review. ``out`` was restored from
    the name of the extracted directory; the download URL could not be
    recovered and must be supplied by the caller -- confirm both.

    Args:
        url: Download URL of the zipped weights, passed to ``gdown``.
        out: Local filename for the downloaded archive.

    Returns:
        Relative path of the extracted ``.pth`` file.

    Raises:
        ValueError: If the weights are missing and ``url`` is empty.
        RuntimeError: If ``gdown`` reports a failed download.
        FileNotFoundError: If the archive does not contain the weights file.
    """
    # The asterisk is a literal part of the filename, not a glob pattern.
    weights = "Paper's_weights_UCF_QNRF/best_M-SFANet*_UCF_QNRF.pth"
    if os.path.exists(weights):
        return weights

    if not url:
        raise ValueError(
            f'{weights!r} was not found and no download URL was provided')

    # Depending on the gdown version a failed download returns None instead
    # of raising, so check the result explicitly.
    if gdown.download(url, out) is None:
        raise RuntimeError(f'failed to download weights from {url!r}')

    # Extract with the standard library rather than an external ``unzip``
    # binary, which may not be installed on the host.
    with zipfile.ZipFile(out) as archive:
        archive.extractall()

    if not os.path.exists(weights):
        raise FileNotFoundError(
            f'{out!r} was extracted but {weights!r} is still missing')
    return weights


def transform_image(img: Image.Image) -> torch.Tensor:
    """Convert a PIL image into a normalized, batched model input.

    The image is resized so that both sides are multiples of 16 (at least
    16 pixels), converted to a tensor, normalized per channel, and given a
    leading batch axis.

    Args:
        img: Three-channel PIL image.

    Returns:
        Tensor with a leading batch dimension of size one.
    """
    trans = transforms.Compose([
        transforms.ToTensor(),
        # Per-channel mean/std; these are the values commonly used with
        # ImageNet-pretrained backbones.
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
    ])

    width, height = img.size
    # Clamp to one full multiple so tiny images never round down to size 0.
    height = max(_SIZE_MULTIPLE,
                 round(height / _SIZE_MULTIPLE) * _SIZE_MULTIPLE)
    width = max(_SIZE_MULTIPLE,
                round(width / _SIZE_MULTIPLE) * _SIZE_MULTIPLE)

    # ``interpolation`` must be passed by keyword: the third positional
    # parameter of cv2.resize is ``dst``, so a positional flag is ignored.
    resized = cv2.resize(
        np.array(img), (width, height), interpolation=cv2.INTER_CUBIC)
    return trans(Image.fromarray(resized))[None, :]


def _normalize_for_display(density: np.ndarray) -> np.ndarray:
    """Scale a density map into [0, 1] so it can be shown as an image."""
    peak = float(density.max())
    if peak <= 0:
        # Nothing positive to show; avoid dividing by zero.
        return np.zeros_like(density)
    return np.clip(density / peak, 0.0, 1.0)


def main() -> None:
    """Run the Streamlit page: load the model and score an uploaded image."""
    st.write(f"Demo of [Encoder-Decoder Based Convolutional Neural Networks with Multi-Scale-Aware Modules for Crowd Counting]({_PAPER_URL})")  # noqa

    path = setup_env()
    weights = download_weights()
    model = get_model(path, weights)

    image_file = st.file_uploader(
        "Upload image", type=['png', 'jpg', 'jpeg'])
    if image_file is not None:
        image = Image.open(image_file).convert('RGB')
        st.image(image)

        # Inference only: skip autograd bookkeeping.
        with torch.no_grad():
            density_map = model(transform_image(image))

        # Drop the batch axis and move channels last for display.
        density_map_img = density_map.detach().numpy()[0].transpose(1, 2, 0)
        st.image(_normalize_for_display(density_map_img))
        # The estimated count is the sum over the predicted density map.
        st.write("Estimated count: ", torch.sum(density_map).item())
    else:
        st.write("Example image to use that you can drag and drop:")
        st.image(Image.open('crowd.jpg').convert('RGB'))


if __name__ == '__main__':
    main()