{
    "model_config": "",
    "checkpoint": null,
    "output_dir": "",
    "mrc_mask_prob": 0.15,
    "max_txt_len": 200,
    "train_batch_size": 32,
    "val_batch_size": 32,
    "gradient_accumulation_steps": 1,
    "learning_rate": 5e-05,
    "valid_steps": 5000,
    "log_steps": 1000,
    "num_train_steps": 100000,
    "optim": "adamw",
    "betas": [
        0.9,
        0.98
    ],
    "dropout": 0.1,
    "weight_decay": 0.01,
    "grad_norm": 5.0,
    "warmup_steps": 10000,
    "seed": 0,
    "fp16": false,
    "n_workers": 1,
    "pin_mem": true,
    "init_pretrained": "lxmert",

    "train_datasets": {
        "R4R": {
            "name": "R4R",
            "train_traj_files": ["../datasets/R4R/annotations/pretrain_map/R4R_train_enc.jsonl"],
            "val_seen_traj_files": ["../datasets/R4R/annotations/pretrain_map/R4R_val_seen_enc.jsonl"],
            "val_unseen_traj_files": ["../datasets/R4R/annotations/pretrain_map/R4R_val_unseen_sampled_enc.jsonl"],
            "connectivity_dir": "../datasets/R2R/connectivity",
            "img_ft_file": "../datasets/R2R/features/pth_vit_base_patch16_224_imagenet.hdf5",
            "scanvp_cands_file": "../datasets/R2R/annotations/scanvp_candview_relangles.json",
            "tasks": [
                "mlm",
                "sap"
            ],
            "mix_ratio": [
                1,
                1
            ]
        }
    }
}
