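"""Compare the computational cost of LoFTR and TopicFM.

Reports the GFLOPs (via fvcore's FlopCountAnalysis) of the feature-extraction
backbone and the coarse matching module of each method, measured on a pair of
ScanNet sample images. It assumes it is run from the repository root so that
`src` and `third_party.loftr` are importable.
"""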
import torch
from fvcore.nn import FlopCountAnalysis
from einops.einops import rearrange

from src import get_model_cfg
from src.models.backbone import FPN as topicfm_featnet
from src.models.modules import TopicFormer
from src.utils.dataset import read_scannet_gray

from third_party.loftr.src.loftr.utils.cvpr_ds_config import default_cfg
from third_party.loftr.src.loftr.backbone import ResNetFPN_8_2 as loftr_featnet
from third_party.loftr.src.loftr.loftr_module import LocalFeatureTransformer


def feat_net_flops(feat_net, config, img):
    """Count the FLOPs of a feature-extraction backbone on a single image."""
    model = feat_net(config)
    model.eval()
    flops = FlopCountAnalysis(model, img)
    # Run the backbone once more to obtain the coarse feature map for the matching stage.
    feat_c, _ = model(img)
    return feat_c, flops.total() / 1e9  # GFLOPs


def coarse_model_flops(coarse_model, config, inputs):
    """Count the FLOPs of a coarse matching module on a pair of coarse feature maps."""
    model = coarse_model(config)
    model.eval()
    flops = FlopCountAnalysis(model, inputs)
    return flops.total() / 1e9  # GFLOPs


if __name__ == "__main__":
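    # Load a grayscale ScanNet sample pair from assets/ and add a batch dimension.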
    path_img0 = "assets/scannet_sample_images/scene0711_00_frame-001680.jpg"
    path_img1 = "assets/scannet_sample_images/scene0711_00_frame-001995.jpg"
    img0, img1 = read_scannet_gray(path_img0), read_scannet_gray(path_img1)
    img0, img1 = img0.unsqueeze(0), img1.unsqueeze(0)

    # LoFTR
    loftr_conf = dict(default_cfg)
    feat_c0, loftr_featnet_flops0 = feat_net_flops(
        loftr_featnet, loftr_conf["resnetfpn"], img0
    )
    feat_c1, loftr_featnet_flops1 = feat_net_flops(
        loftr_featnet, loftr_conf["resnetfpn"], img1
    )
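    # Report the backbone cost as the per-image average over the two inputs.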
    print(
        "FLOPs of feature extraction in LoFTR: {} GFLOPs".format(
            (loftr_featnet_flops0 + loftr_featnet_flops1) / 2
        )
    )
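    # Flatten spatial dims to token sequences, as expected by the coarse transformer.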
    feat_c0 = rearrange(feat_c0, "n c h w -> n (h w) c")
    feat_c1 = rearrange(feat_c1, "n c h w -> n (h w) c")
    loftr_coarse_model_flops = coarse_model_flops(
        LocalFeatureTransformer, loftr_conf["coarse"], (feat_c0, feat_c1)
    )
    print(
        "FLOPs of coarse matching model in LoFTR: {} GFLOPs".format(
            loftr_coarse_model_flops
        )
    )

    # TopicFM
    topicfm_conf = get_model_cfg()
    feat_c0, topicfm_featnet_flops0 = feat_net_flops(
        topicfm_featnet, topicfm_conf["fpn"], img0
    )
    feat_c1, topicfm_featnet_flops1 = feat_net_flops(
        topicfm_featnet, topicfm_conf["fpn"], img1
    )
    print(
        "FLOPs of feature extraction in TopicFM: {} GFLOPs".format(
            (topicfm_featnet_flops0 + topicfm_featnet_flops1) / 2
        )
    )
    feat_c0 = rearrange(feat_c0, "n c h w -> n (h w) c")
    feat_c1 = rearrange(feat_c1, "n c h w -> n (h w) c")
    topicfm_coarse_model_flops = coarse_model_flops(
        TopicFormer, topicfm_conf["coarse"], (feat_c0, feat_c1)
    )
    print(
        "FLOPs of coarse matching model in TopicFM: {} GFLOPs".format(
            topicfm_coarse_model_flops
        )
    )