{                                                                                                     
  "model_path": "cater-cam",
  "datatype": "cater-cam",
  "dataset": "cater-cam",
  "num_workers": 16,
  "prefetch_factor": 1,
  "learning_rate": 0.0003, 
  "min_lr": 0.0001,
  "max_lr": 0.003,
  "use_cosine_annealing": false,
  "coseine_annealing_steps": 250000,
  "weight_decay": 0.001,
  "sequence_len": 24, 
  "backprop_steps": 2,
  "pretrainer_iterations": 3,
  "pretraining_mode": "mask",
  "update_interval": 1,
  "epochs": 1000,                                                                                   
  "updates": 50000000,
  "closed_loop": false,
  "teacher_forcing": 3,                                                                              
  "statistics_offset": 0,                                                                              
  "msssim": false,
  "load_optimizers": false,
  "scheduled_sampling": false,
  "world_size": 1,
  "data": {
        "train": [
            { 
                "path": "/media/chief/data/Datasets-HDF5-Compressed/CATER-CAM/CATER-train-240x320.hdf5", 
                "weight": 1.0, "split": false, "depth_weighting": false, "time_std_dev": 0, "static": false, 
                "uncertainty_regularizer": 0.05, "rgb_loss_factor": 1, "rgb_warmup": 20000, "depth_warmup": 0, "color_input": false
            }
        ],
        "val": [
            { 
                "path": "/media/chief/data/Datasets-HDF5-Compressed/CATER-CAM/CATER-val-240x320.hdf5", 
                "weight": 1.0, "split": false, "depth_weighting": false, "time_std_dev": 0, "static": false, 
                "uncertainty_regularizer": 0.05, "rgb_loss_factor": 1, "rgb_warmup": 20000, "depth_warmup": 0, "color_input": false
            }
        ],
        "test": [
            { 
                "path": "/media/chief/data/Datasets-HDF5-Compressed/CATER-CAM/CATER-test-240x320.hdf5", 
                "weight": 1.0, "split": false, "depth_weighting": false, "time_std_dev": 0, "static": false, 
                "uncertainty_regularizer": 0.05, "rgb_loss_factor": 1, "rgb_warmup": 20000, "depth_warmup": 0, "color_input": false
            }
        ] 
  },
  "model": {
        "level": 2,
        "batch_size": 32,
        "num_objects": 16,
        "img_channels": 3,
        "input_depth": false,
        "input_size": [256,  256], 
        "crop_size": [256,  256],
        "latent_size": [16, 16], 
        "vae_factor": 1e-5,
        "object_permanence_strength": 1,
        "object_regularizer": 0,
        "position_regularizer": 1,
        "time_regularizer": 1,
        "encoder_regularizer": 0.1,
        "supervision_factor": 0,
        "entity_pretraining_steps": 10000000,
        "mixed_precision": false,
        "gradient_accumulation_steps": 1,
        "rgb_loss": "YCbCrL2SSIMLoss",
        "embedding": {
            "mask": { 
                "channels": 32,
                "expansion": 4
            },
            "depth": {
                "channels": 64,
                "expansion": 4
            },
            "rgb": {
                "channels": 128,
                "expansion": 4
            }
        },
        "encoder": {
            "hyper": true,
            "channels": 32,
            "blocks": [1,1,3,2],
            "hyper_channels": 256,
            "level1_channels": 32,
            "gestalt_size": 256,
            "bottleneck": "binar",
            "gestalt_frozzen": true
        },
        "predictor": {
            "heads": 2,
            "layers": 2,
            "channels_multiplier": 2,
            "reg_lambda": 1e-10,
            "gestalt_size": 256,
            "bottleneck": "binar"
        },
        "decoder": {
            "mask": {
                "pretrain_encoder_blocks": [2,4],
                "pretrain_encoder_channels": 256
            },
            "depth": {
                "layers": 3,
                "pretrain_encoder_blocks": [2,4],
                "pretrain_encoder_channels": 256
            },
            "rgb": {
                "layers": 5,
                "pretrain_encoder_blocks": [4,8],
                "pretrain_encoder_channels": 256
            }
        },
        "background": {
            "supervision_factor": 0.1,
            "uncertainty_threshold": 0.5,
            "gan_loss_pretraining": 50000000,
            "gan_loss_factor": 0.5,
            "masking_ratio": 0.75,
            "uncertainty_noise_ratio": 0.1,
            "motion_context_size": 256,
            "depth_context_size": 256,
            "latent_channels": 64,
            "num_layers": 2
        }
    }
}                          
