Update Configs/sam2_hiera_large.yaml
Browse files
Configs/sam2_hiera_large.yaml
CHANGED
|
@@ -24,7 +24,7 @@ model:
|
|
| 24 |
temperature: 10000
|
| 25 |
d_model: 256
|
| 26 |
backbone_channel_list: [1152, 576, 288, 144]
|
| 27 |
-
fpn_top_down_levels: [2, 3]
|
| 28 |
fpn_interp_model: nearest
|
| 29 |
|
| 30 |
memory_attention:
|
|
@@ -82,36 +82,24 @@ model:
|
|
| 82 |
kernel_size: 7
|
| 83 |
padding: 3
|
| 84 |
layer_scale_init_value: 1e-6
|
| 85 |
-
use_dwconv: true
|
| 86 |
num_layers: 2
|
| 87 |
|
| 88 |
num_maskmem: 7
|
| 89 |
image_size: 1024
|
| 90 |
-
# apply scaled sigmoid on mask logits for memory encoder, and directly feed input mask as output mask
|
| 91 |
-
# SAM decoder
|
| 92 |
sigmoid_scale_for_mem_enc: 20.0
|
| 93 |
sigmoid_bias_for_mem_enc: -10.0
|
| 94 |
use_mask_input_as_output_without_sam: true
|
| 95 |
-
# Memory
|
| 96 |
directly_add_no_mem_embed: true
|
| 97 |
-
no_obj_embed_spatial: true
|
| 98 |
-
# use high-resolution feature map in the SAM mask decoder
|
| 99 |
use_high_res_features_in_sam: true
|
| 100 |
-
# output 3 masks on the first click on initial conditioning frames
|
| 101 |
multimask_output_in_sam: true
|
| 102 |
-
# SAM heads
|
| 103 |
iou_prediction_use_sigmoid: true
|
| 104 |
-
# cross-attend to object pointers from other frames (based on SAM output tokens) in the encoder
|
| 105 |
use_obj_ptrs_in_encoder: true
|
| 106 |
-
add_tpos_enc_to_obj_ptrs:
|
| 107 |
-
proj_tpos_enc_in_obj_ptrs: true
|
| 108 |
-
use_signed_tpos_enc_to_obj_ptrs: true
|
| 109 |
only_obj_ptrs_in_the_past_for_eval: true
|
| 110 |
-
# object occlusion prediction
|
| 111 |
pred_obj_scores: true
|
| 112 |
pred_obj_scores_mlp: true
|
| 113 |
fixed_no_obj_ptr: true
|
| 114 |
-
# multimask tracking settings
|
| 115 |
multimask_output_for_tracking: true
|
| 116 |
use_multimask_token_for_obj_ptr: true
|
| 117 |
multimask_min_pt_num: 0
|
|
|
|
| 24 |
temperature: 10000
|
| 25 |
d_model: 256
|
| 26 |
backbone_channel_list: [1152, 576, 288, 144]
|
| 27 |
+
fpn_top_down_levels: [2, 3]
|
| 28 |
fpn_interp_model: nearest
|
| 29 |
|
| 30 |
memory_attention:
|
|
|
|
| 82 |
kernel_size: 7
|
| 83 |
padding: 3
|
| 84 |
layer_scale_init_value: 1e-6
|
| 85 |
+
use_dwconv: true
|
| 86 |
num_layers: 2
|
| 87 |
|
| 88 |
num_maskmem: 7
|
| 89 |
image_size: 1024
|
|
|
|
|
|
|
| 90 |
sigmoid_scale_for_mem_enc: 20.0
|
| 91 |
sigmoid_bias_for_mem_enc: -10.0
|
| 92 |
use_mask_input_as_output_without_sam: true
|
|
|
|
| 93 |
directly_add_no_mem_embed: true
|
|
|
|
|
|
|
| 94 |
use_high_res_features_in_sam: true
|
|
|
|
| 95 |
multimask_output_in_sam: true
|
|
|
|
| 96 |
iou_prediction_use_sigmoid: true
|
|
|
|
| 97 |
use_obj_ptrs_in_encoder: true
|
| 98 |
+
add_tpos_enc_to_obj_ptrs: false
|
|
|
|
|
|
|
| 99 |
only_obj_ptrs_in_the_past_for_eval: true
|
|
|
|
| 100 |
pred_obj_scores: true
|
| 101 |
pred_obj_scores_mlp: true
|
| 102 |
fixed_no_obj_ptr: true
|
|
|
|
| 103 |
multimask_output_for_tracking: true
|
| 104 |
use_multimask_token_for_obj_ptr: true
|
| 105 |
multimask_min_pt_num: 0
|