Spaces:

nebula
/

counting-anything

Runtime error

File size: 5,448 Bytes

078145b

import cv2
import argparse
import json
import numpy as np
from tqdm import tqdm
from os.path import exists
import os

from segment_anything import sam_model_registry
from automatic_mask_generator import SamAutomaticMaskGenerator
import matplotlib.pyplot as plt




parser = argparse.ArgumentParser(description="Few Shot Counting Evaluation code")
parser.add_argument("-dp", "--data_path", type=str, default='/data/counte/', help="Path to the coco dataset")
parser.add_argument("-ts", "--test_split", type=str, default='val2017', choices=["val2017"], help="what data split to evaluate on")
parser.add_argument("-mt", "--model_type", type=str, default="vit_h", help="model type")
parser.add_argument("-mp",  "--model_path", type=str, default="/home/teddy/segment-anything/sam_vit_h_4b8939.pth", help="path to trained model")
parser.add_argument("-v",  "--viz", type=bool, default=True, help="wether to visualize")
parser.add_argument("-d",   "--device", default='0', help='assign device')
args = parser.parse_args()

data_path = args.data_path
anno_file = data_path + 'annotations_trainval2017/annotations/instances_val2017.json'
im_dir = data_path + 'val2017'


if not exists(anno_file) or not exists(im_dir):
    print("Make sure you set up the --data-path correctly.")
    print("Current setting is {}, but the image dir and annotation file do not exist.".format(args.data_path))
    print("Aborting the evaluation")
    exit(-1)

def show_anns(anns):
    if len(anns) == 0:
        return
    sorted_anns = sorted(anns, key=(lambda x: x['area']), reverse=True)
    ax = plt.gca()
    ax.set_autoscale_on(False)
    for ann in sorted_anns:
        x0, y0, w, h = ann['bbox']
        ax.add_patch(plt.Rectangle((x0, y0), w, h, edgecolor='green', facecolor=(0,0,0,0), lw=2))
        ax.scatter([x0+w//2], [y0+h//2], color='green', marker='*', s=10, edgecolor='white', linewidth=1.25)


debug = True
os.environ['CUDA_VISIBLE_DEVICES'] = args.device.strip()
device = 'cuda'
sam = sam_model_registry[args.model_type](checkpoint=args.model_path)
sam.to(device=device)


mask_generator = SamAutomaticMaskGenerator(
                                model=sam,
                                min_mask_region_area=25
                                )

with open(anno_file) as f:
    annotations = json.load(f)
    
images = sorted(annotations['images'],key=lambda x:x['file_name'])

prepared_json = {}
for i in images:
    prepared_json[i['file_name']] = {
        "H":i['height'],
        "W":i['width'],
        "boxes":{},
        # "category_ids":[],
    }
for i in annotations['annotations']:
    im_id = str(i['image_id'])
    prezero = 12 - len(im_id)
    im_id = '0'*prezero + im_id + ".jpg"
    if i["category_id"] in prepared_json[im_id]["boxes"]:
        prepared_json[im_id]["boxes"][i["category_id"]].append(i['bbox'])
    else:
        prepared_json[im_id]["boxes"][i["category_id"]] = []
        prepared_json[im_id]["boxes"][i["category_id"]].append(i['bbox'])

im_ids = []
for i in prepared_json.keys():
    im_ids.append(i)


cnt = 0
folds = [
    [1,5,9,14,18,22,27,33,37,41,46,50,54,58,62,67,74,78,82,87],
    [2,6,10,15,19,23,28,34,38,42,47,51,55,59,63,70,75,79,84,88],
    [3,7,11,16,20,24,31,35,39,43,48,52,56,60,64,72,76,80,85,89],
    [4,8,13,17,21,25,32,36,40,44,49,53,57,61,65,73,77,81,86,90],
]
SAE = [0,0,0,0]  # sum of absolute errors
SSE = [0,0,0,0]  # sum of square errors

print("Evaluation on {} data".format(args.test_split))

# logs = []


pbar = tqdm(im_ids)
# err_list = []
for im_id in pbar:
    category_id = list(prepared_json[im_id]['boxes'].keys())
    
    image = cv2.imread('{}/{}'.format(im_dir, im_id))
    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    # log = []
    # log.append(im_id)
    
    for id in category_id:
        boxes = prepared_json[im_id]['boxes'][id]
        
        input_boxes = list()
        x1, y1 = boxes[0][0],boxes[0][1]
        x2, y2 = boxes[0][0] + boxes[0][2],boxes[0][1] + boxes[0][3]
        input_boxes.append([x1, y1, x2, y2])
        
        masks = mask_generator.generate(image, input_boxes)
        
        if args.viz:
            if not exists('viz'):
                os.mkdir('viz')
            plt.figure(figsize=(10,10))
            plt.imshow(image)
            show_anns(masks)
            plt.axis('off')
            plt.savefig('viz/{}_{}.jpg'.format(im_id[0:-4],id))
            plt.close()
        
        gt_cnt = len(boxes)
        pred_cnt = len(masks)
        err = abs(gt_cnt - pred_cnt)
        log.append("\n{},gt_cnt:{},pred_cnt:{}".format(id,gt_cnt,pred_cnt))
        if id in folds[0]:
            SAE[0] += err
            SSE[0] += err**2
        elif id in folds[1]:
            SAE[1] += err
            SSE[1] += err**2
        elif id in folds[2]:
            SAE[2] += err
            SSE[2] += err**2
        elif id in folds[3]: 
            SAE[3] += err
            SSE[3] += err**2

    cnt = cnt + 1
    # logs.append(log)
    pbar.set_description('fold1: {:6.2f}, fold2: {:6.2f}, fold3: {:6.2f}, fold4: {:6.2f},'.\
                        format(SAE[0]/cnt,SAE[1]/cnt,SAE[2]/cnt,SAE[3]/cnt))
    
print('On {} data, fold1 MAE: {:6.2f}, RMSE: {:6.2f}\n \
    fold2 MAE: {:6.2f}, RMSE: {:6.2f}\n \
    fold3 MAE: {:6.2f}, RMSE: {:6.2f}\n \
    fold4 MAE: {:6.2f}, RMSE: {:6.2f}\n \
    '.format(args.test_split,SAE[0]/cnt,(SSE[0]/cnt)**0.5,SAE[1]/cnt,(SSE[1]/cnt)**0.5,SAE[2]/cnt,(SSE[2]/cnt)**0.5,SAE[3]/cnt,(SSE[3]/cnt)**0.5))