MogensR committed on
Commit
a543976
·
1 Parent(s): fe04664

Update Configs/sam2_hiera_large.yaml

Browse files
Files changed (1) hide show
  1. Configs/sam2_hiera_large.yaml +3 -15
Configs/sam2_hiera_large.yaml CHANGED
@@ -24,7 +24,7 @@ model:
24
  temperature: 10000
25
  d_model: 256
26
  backbone_channel_list: [1152, 576, 288, 144]
27
- fpn_top_down_levels: [2, 3] # output level 0 and 1 directly use the backbone features
28
  fpn_interp_model: nearest
29
 
30
  memory_attention:
@@ -82,36 +82,24 @@ model:
82
  kernel_size: 7
83
  padding: 3
84
  layer_scale_init_value: 1e-6
85
- use_dwconv: true # depth-wise convs
86
  num_layers: 2
87
 
88
  num_maskmem: 7
89
  image_size: 1024
90
- # apply scaled sigmoid on mask logits for memory encoder, and directly feed input mask as output mask
91
- # SAM decoder
92
  sigmoid_scale_for_mem_enc: 20.0
93
  sigmoid_bias_for_mem_enc: -10.0
94
  use_mask_input_as_output_without_sam: true
95
- # Memory
96
  directly_add_no_mem_embed: true
97
- no_obj_embed_spatial: true
98
- # use high-resolution feature map in the SAM mask decoder
99
  use_high_res_features_in_sam: true
100
- # output 3 masks on the first click on initial conditioning frames
101
  multimask_output_in_sam: true
102
- # SAM heads
103
  iou_prediction_use_sigmoid: true
104
- # cross-attend to object pointers from other frames (based on SAM output tokens) in the encoder
105
  use_obj_ptrs_in_encoder: true
106
- add_tpos_enc_to_obj_ptrs: true
107
- proj_tpos_enc_in_obj_ptrs: true
108
- use_signed_tpos_enc_to_obj_ptrs: true
109
  only_obj_ptrs_in_the_past_for_eval: true
110
- # object occlusion prediction
111
  pred_obj_scores: true
112
  pred_obj_scores_mlp: true
113
  fixed_no_obj_ptr: true
114
- # multimask tracking settings
115
  multimask_output_for_tracking: true
116
  use_multimask_token_for_obj_ptr: true
117
  multimask_min_pt_num: 0
 
24
  temperature: 10000
25
  d_model: 256
26
  backbone_channel_list: [1152, 576, 288, 144]
27
+ fpn_top_down_levels: [2, 3]
28
  fpn_interp_model: nearest
29
 
30
  memory_attention:
 
82
  kernel_size: 7
83
  padding: 3
84
  layer_scale_init_value: 1e-6
85
+ use_dwconv: true
86
  num_layers: 2
87
 
88
  num_maskmem: 7
89
  image_size: 1024
 
 
90
  sigmoid_scale_for_mem_enc: 20.0
91
  sigmoid_bias_for_mem_enc: -10.0
92
  use_mask_input_as_output_without_sam: true
 
93
  directly_add_no_mem_embed: true
 
 
94
  use_high_res_features_in_sam: true
 
95
  multimask_output_in_sam: true
 
96
  iou_prediction_use_sigmoid: true
 
97
  use_obj_ptrs_in_encoder: true
98
+ add_tpos_enc_to_obj_ptrs: false
 
 
99
  only_obj_ptrs_in_the_past_for_eval: true
 
100
  pred_obj_scores: true
101
  pred_obj_scores_mlp: true
102
  fixed_no_obj_ptr: true
 
103
  multimask_output_for_tracking: true
104
  use_multimask_token_for_obj_ptr: true
105
  multimask_min_pt_num: 0