YaTharThShaRma999
/

PromptTest

Model card Files Files and versions Community

YaTharThShaRma999 committed on Feb 11

Commit

d279346

•

1 Parent(s): fba9c83

Rename config.json to swint.py

Browse files

Files changed (2) hide show

config.json +0 -37
swint.py +118 -0

config.json DELETED Viewed

@@ -1,37 +0,0 @@
-{
-  "_name_or_path": "mistralai/Mistral-7B-v0.1",
-  "architectures": [
-    "LlavaMistralForCausalLM"
-  ],
-  "bos_token_id": 1,
-  "eos_token_id": 2,
-  "freeze_mm_mlp_adapter": false,
-  "hidden_act": "silu",
-  "hidden_size": 4096,
-  "image_aspect_ratio": "pad",
-  "image_grid_pinpoints": null,
-  "initializer_range": 0.02,
-  "intermediate_size": 14336,
-  "max_position_embeddings": 32768,
-  "mm_hidden_size": 1024,
-  "mm_projector_type": "mlp2x_gelu",
-  "mm_use_im_patch_token": false,
-  "mm_use_im_start_end": false,
-  "mm_vision_select_feature": "patch",
-  "mm_vision_select_layer": -2,
-  "mm_vision_tower": "openai/clip-vit-large-patch14-336",
-  "model_type": "llava_mistral",
-  "num_attention_heads": 32,
-  "num_hidden_layers": 32,
-  "num_key_value_heads": 8,
-  "rms_norm_eps": 1e-05,
-  "rope_theta": 10000.0,
-  "sliding_window": 4096,
-  "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.35.0.dev0",
-  "tune_mm_mlp_adapter": false,
-  "use_cache": true,
-  "use_mm_proj": true,
-  "vocab_size": 32000
-}

swint.py ADDED Viewed

@@ -0,0 +1,118 @@

+data_aug_scales = [480, 512, 544, 576, 608, 640, 672, 704, 736, 768, 800]
+data_aug_max_size = 1333
+data_aug_scales2_resize = [400, 500, 600]
+data_aug_scales2_crop = [384, 600]
+data_aug_scale_overlap = None
+batch_size = 4
+modelname = 'groundingdino'
+backbone = 'swin_T_224_1k'
+position_embedding = 'sine'
+pe_temperatureH = 20
+pe_temperatureW = 20
+return_interm_indices = [1, 2, 3]
+enc_layers = 6
+dec_layers = 6
+pre_norm = False
+dim_feedforward = 2048
+hidden_dim = 256
+dropout = 0.0
+nheads = 8
+num_queries = 900
+query_dim = 4
+num_patterns = 0
+num_feature_levels = 4
+enc_n_points = 4
+dec_n_points = 4
+two_stage_type = 'standard'
+two_stage_bbox_embed_share = False
+two_stage_class_embed_share = False
+transformer_activation = 'relu'
+dec_pred_bbox_embed_share = True
+dn_box_noise_scale = 1.0
+dn_label_noise_ratio = 0.5
+dn_label_coef = 1.0
+dn_bbox_coef = 1.0
+embed_init_tgt = True
+dn_labelbook_size = 91
+max_text_len = 256
+text_encoder_type = "bert-base-uncased"
+use_text_enhancer = True
+use_fusion_layer = True
+use_checkpoint = True
+use_transformer_ckpt = True
+use_text_cross_attention = True
+text_dropout = 0.0
+fusion_dropout = 0.0
+fusion_droppath = 0.1
+sub_sentence_present = True
+max_labels = 50                               # pos + neg
+lr = 0.0001                                   # base learning rate
+backbone_freeze_keywords = None               # only for gdino backbone
+freeze_keywords = ['bert']                    # applies to the whole model, e.g. ['backbone.0', 'bert'] to freeze the visual encoder and the text encoder
+lr_backbone = 1e-05                           # specific learning rate
+lr_backbone_names = ['backbone.0', 'bert']
+lr_linear_proj_mult = 1e-05
+lr_linear_proj_names = ['ref_point_head', 'sampling_offsets']
+weight_decay = 0.0001
+param_dict_type = 'ddetr_in_mmdet'
+ddetr_lr_param = False
+epochs = 15
+lr_drop = 4
+save_checkpoint_interval = 1
+clip_max_norm = 0.1
+onecyclelr = False
+multi_step_lr = False
+lr_drop_list = [4, 8]
+frozen_weights = None
+dilation = False
+pdetr3_bbox_embed_diff_each_layer = False
+pdetr3_refHW = -1
+random_refpoints_xy = False
+fix_refpoints_hw = -1
+dabdetr_yolo_like_anchor_update = False
+dabdetr_deformable_encoder = False
+dabdetr_deformable_decoder = False
+use_deformable_box_attn = False
+box_attn_type = 'roi_align'
+dec_layer_number = None
+decoder_layer_noise = False
+dln_xy_noise = 0.2
+dln_hw_noise = 0.2
+add_channel_attention = False
+add_pos_value = False
+two_stage_pat_embed = 0
+two_stage_add_query_num = 0
+two_stage_learn_wh = False
+two_stage_default_hw = 0.05
+two_stage_keep_all_tokens = False
+num_select = 300
+batch_norm_type = 'FrozenBatchNorm2d'
+masks = False
+aux_loss = True
+set_cost_class = 1.0
+set_cost_bbox = 5.0
+set_cost_giou = 2.0
+cls_loss_coef = 2.0
+bbox_loss_coef = 5.0
+giou_loss_coef = 2.0
+enc_loss_coef = 1.0
+interm_loss_coef = 1.0
+no_interm_box_loss = False
+mask_loss_coef = 1.0
+dice_loss_coef = 1.0
+focal_alpha = 0.25
+focal_gamma = 2.0
+decoder_sa_type = 'sa'
+matcher_type = 'HungarianMatcher'
+decoder_module_seq = ['sa', 'ca', 'ffn']
+nms_iou_threshold = -1
+dec_pred_class_embed_share = True
+match_unstable_error = True
+use_ema = False
+ema_decay = 0.9997
+ema_epoch = 0
+use_detached_boxes_dec_out = False
+use_coco_eval = True
+dn_scalar = 100