{
    "model_config": "",
    "checkpoint": null,
    "output_dir": "",
    "mrc_mask_prob": 0.15,
    "max_txt_len": 200,
    "train_batch_size": 16,
    "val_batch_size": 16,
    "gradient_accumulation_steps": 1,
    "learning_rate": 5e-05,
    "valid_steps": 2500,
    "log_steps": 1000,
    "num_train_steps": 200000,
    "optim": "adamw",
    "betas": [
        0.9,
        0.98
    ],
    "dropout": 0.1,
    "weight_decay": 0.01,
    "grad_norm": 5.0,
    "warmup_steps": 10000,
    "seed": 0,
    "fp16": false,
    "n_workers": 1,
    "pin_mem": true,
    "init_pretrained": "lxmert",

    "train_datasets": {
        "R2R": {
            "name": "R2R",
            "train_traj_files": ["../datasets/R2R/annotations/pretrain_map/R2R_train_enc.jsonl",
                                "../datasets/R2R/annotations/pretrain_map/R2R_prevalent_aug_train_enc.jsonl"],
            "val_seen_traj_files": ["../datasets/R2R/annotations/pretrain_map/R2R_val_seen_enc.jsonl"],
            "val_unseen_traj_files": ["../datasets/R2R/annotations/pretrain_map/R2R_val_unseen_enc.jsonl"],
            "connectivity_dir": "../datasets/R2R/connectivity",
            "img_ft_file": "../datasets/R2R/features/clip_vit-b16_mp3d_original.hdf5",
            "scanvp_cands_file": "../datasets/R2R/annotations/scanvp_candview_relangles.json",
            "tasks": [
                "mlm",
                "mrc",
                "sap"
            ],
            "mix_ratio": [
                1,
                1,
                1
            ]
        }
    }
}
