Spaces:

mathiaszinnen
/

odor-detection

Runtime error

odor-detection / demo-confs /models /dino_vitdet.py

Initialize app

3e99b05 over 1 year ago

1.59 kB

	from functools import partial
	import torch.nn as nn
	from detectron2.config import LazyCall as L
	from detectron2.layers import ShapeSpec
	from detectron2.modeling import ViT, SimpleFeaturePyramid
	from detectron2.modeling.backbone.fpn import LastLevelMaxPool

	from .dino_r50 import model


	# ViT Base Hyper-params
	embed_dim, depth, num_heads, dp = 768, 12, 12, 0.1

	# Creates Simple Feature Pyramid from ViT backbone
	model.backbone = L(SimpleFeaturePyramid)(
	net=L(ViT)( # Single-scale ViT backbone
	img_size=1024,
	patch_size=16,
	embed_dim=embed_dim,
	depth=depth,
	num_heads=num_heads,
	drop_path_rate=dp,
	window_size=14,
	mlp_ratio=4,
	qkv_bias=True,
	norm_layer=partial(nn.LayerNorm, eps=1e-6),
	window_block_indexes=[
	# 2, 5, 8 11 for global attention
	0,
	1,
	3,
	4,
	6,
	7,
	9,
	10,
	],
	residual_block_indexes=[],
	use_rel_pos=True,
	out_feature="last_feat",
	),
	in_feature="${.net.out_feature}",
	out_channels=256,
	scale_factors=(2.0, 1.0, 0.5), # (4.0, 2.0, 1.0, 0.5) in ViTDet
	top_block=L(LastLevelMaxPool)(),
	norm="LN",
	square_pad=1024,
	)

	# modify neck config
	model.neck.input_shapes = {
	"p3": ShapeSpec(channels=256),
	"p4": ShapeSpec(channels=256),
	"p5": ShapeSpec(channels=256),
	"p6": ShapeSpec(channels=256),
	}
	model.neck.in_features = ["p3", "p4", "p5", "p6"]
	model.neck.num_outs = 4
	model.transformer.num_feature_levels = 4