# Patch summary (free-form preamble; patch tools skip text that precedes the
# first "diff --git" header).
#
# 1. README.md: adds an entry numbered 2 for GroundingDINO-B (Swin-B) with the
#    value 56.7 and two links.
#    NOTE(review): the hunk header declares 6 context lines and 9 additions,
#    but only a fragment of the context text is present in this copy
#    (presumably the surrounding markup was stripped -- confirm against the
#    originating commit). Restore or drop this hunk before applying the patch.
# 2. groundingdino/config/GroundingDINO_SwinB.cfg.py: new file containing 43
#    flat module-level settings (backbone "swin_B_384_22k", text encoder
#    "bert-base-uncased"); the count matches the "+1,43" hunk header.
diff --git a/README.md b/README.md
index 9dd6fc6..2e9e931 100644
--- a/README.md
+++ b/README.md
@@ -108,6 +108,15 @@ We also provide a demo code to integrate Grounding DINO with Gradio Web UI. See
 Github link | HF link link
+
+ 2
+ GroundingDINO-B
+ Swin-B
+ COCO,O365,GoldG,Cap4M,OpenImage,OdinW-35,RefCOCO
+ 56.7
+ Github link
+ link
+
diff --git a/groundingdino/config/GroundingDINO_SwinB.cfg.py b/groundingdino/config/GroundingDINO_SwinB.cfg.py
new file mode 100644
index 0000000..f490c4b
--- /dev/null
+++ b/groundingdino/config/GroundingDINO_SwinB.cfg.py
@@ -0,0 +1,43 @@
+batch_size = 1
+modelname = "groundingdino"
+backbone = "swin_B_384_22k"
+position_embedding = "sine"
+pe_temperatureH = 20
+pe_temperatureW = 20
+return_interm_indices = [1, 2, 3]
+backbone_freeze_keywords = None
+enc_layers = 6
+dec_layers = 6
+pre_norm = False
+dim_feedforward = 2048
+hidden_dim = 256
+dropout = 0.0
+nheads = 8
+num_queries = 900
+query_dim = 4
+num_patterns = 0
+num_feature_levels = 4
+enc_n_points = 4
+dec_n_points = 4
+two_stage_type = "standard"
+two_stage_bbox_embed_share = False
+two_stage_class_embed_share = False
+transformer_activation = "relu"
+dec_pred_bbox_embed_share = True
+dn_box_noise_scale = 1.0
+dn_label_noise_ratio = 0.5
+dn_label_coef = 1.0
+dn_bbox_coef = 1.0
+embed_init_tgt = True
+dn_labelbook_size = 2000
+max_text_len = 256
+text_encoder_type = "bert-base-uncased"
+use_text_enhancer = True
+use_fusion_layer = True
+use_checkpoint = True
+use_transformer_ckpt = True
+use_text_cross_attention = True
+text_dropout = 0.0
+fusion_dropout = 0.0
+fusion_droppath = 0.1
+sub_sentence_present = True