# Model configuration: one plain module-level assignment per option.
#
# This module deliberately defines nothing except the options themselves
# (no imports, no helpers), so a loader that collects every module-level
# name sees exactly these keys.
#
# NOTE(review): the section headings below are inferred from the option
# names only; confirm against the code that consumes this config.

# --- General ---------------------------------------------------------------
batch_size = 1
modelname = "groundingdino"

# --- Backbone and positional embedding (presumed) ---------------------------
backbone = "swin_T_224_1k"
position_embedding = "sine"
pe_temperatureH = 20
pe_temperatureW = 20
return_interm_indices = [1, 2, 3]
backbone_freeze_keywords = None  # None is the literal value; meaning is defined by the consumer

# --- Transformer encoder / decoder (presumed) -------------------------------
enc_layers = 6
dec_layers = 6
pre_norm = False
dim_feedforward = 2048
hidden_dim = 256
dropout = 0.0
nheads = 8
num_queries = 900
query_dim = 4
num_patterns = 0
num_feature_levels = 4
enc_n_points = 4
dec_n_points = 4
two_stage_type = "standard"
two_stage_bbox_embed_share = False
two_stage_class_embed_share = False
transformer_activation = "relu"
dec_pred_bbox_embed_share = True

# --- "dn_*" options (presumably denoising-related; TODO confirm) -------------
dn_box_noise_scale = 1.0
dn_label_noise_ratio = 0.5
dn_label_coef = 1.0
dn_bbox_coef = 1.0
embed_init_tgt = True
dn_labelbook_size = 2000

# --- Text branch and feature fusion (presumed) ------------------------------
max_text_len = 256
text_encoder_type = "bert-base-uncased"
use_text_enhancer = True
use_fusion_layer = True
use_checkpoint = True
use_transformer_ckpt = True
use_text_cross_attention = True
text_dropout = 0.0
fusion_dropout = 0.0
fusion_droppath = 0.1
sub_sentence_present = True