# Run-level settings for the 'gref_umd' experiment.
# NOTE(review): the code that consumes these names is not visible in this
# file; remarks on meaning below are inferred from the names — confirm
# against the loader.
dataset = 'gref_umd'

# Output location for this run (presumably checkpoints and logs — confirm).
output_dir = 'work_dirs/Hightlighter_R50_gref_umd/'

# Training schedule.
batch_size = 32
epochs = 90
lr_drop = 60  # presumably the epoch at which the learning rate is lowered — TODO confirm

# Module freezing: with freeze_epochs set to 0 the listed modules are
# presumably never frozen — verify how the trainer interprets 0.
freeze_epochs = 0
freeze_modules = [
    'backbone',
    'input_proj',
    'trans_encoder',
    'bert',
]

# Checkpoint path (presumably loaded as initial weights — confirm).
load_weights_path = r'pretrained_checkpoints/detr-r50-gref.pth'

# Model configuration, expressed as nested plain dicts.
# NOTE(review): each 'type' string presumably names a class resolved by a
# builder/registry elsewhere in the project — not visible here, confirm.
model_config = {
    'decoder': {
        'type': 'Decoder',
        'num_queries': 1,
        'query_dim': 256,
        'norm_dim': 256,
        'return_intermediate': True,
        'num_layers': 6,
        # Settings for one decoder layer; all widths below are 256, matching
        # query_dim / norm_dim above.
        'layer': {
            'type': 'MultiStageDecoderLayer',
            'd_model': 256,
            'dim_feedforward': 2048,
            # Layer-level dropout is 0.0, while both attention blocks
            # below use 0.1.
            'dropout': 0.0,
            # The two attention configs are deliberately separate dict
            # objects with equal contents, so mutating one leaves the
            # other untouched.
            'word_attn_args': {
                'type': 'MultiheadAttention',
                'embed_dim': 256,
                'num_heads': 8,
                'dropout': 0.1,
            },
            'img_attn_args': {
                'type': 'MultiheadAttention',
                'embed_dim': 256,
                'num_heads': 8,
                'dropout': 0.1,
            },
        },
    },
}
