{                                                                                                     
  "model_path": "sim-based",
  "datatype": "sim-based",
  "dataset": "sim-based",
  "num_workers": 4,
  "prefetch_factor": 1,
  "learning_rate": 0.00001, 
  "min_lr": 0.0001,
  "max_lr": 0.003,
  "use_cosine_annealing": false,
  "coseine_annealing_steps": 250000,
  "weight_decay": 0.001,
  "sequence_len": 24, 
  "backprop_steps": 2,
  "pretrainer_iterations": 3,
  "pretraining_mode": "all",
  "update_interval": 1,
  "epochs": 1000,                                                                                   
  "updates": 50000000,
  "closed_loop": false,
  "teacher_forcing": 10,                                                                              
  "statistics_offset": 0,                                                                              
  "msssim": false,
  "load_optimizers": false,
  "scheduled_sampling": false,
  "world_size": 1,
  "data": {
        "train": [
            { "path": "/media/chief/data/Datasets-HDF5-Compressed/Kubric-Datasets/movi-d-train-256x256.hdf5", "weight": 1.0, "split": false}
        ],
        "val": [
            { "path": "/media/chief/data/Datasets-HDF5-Compressed/Kubric-Datasets/movi-d-validation-256x256.hdf5", "weight": 1.0, "split": false}
        ],
        "test": [
            { "path": "/media/chief/data/Datasets-HDF5-Compressed/Kubric-Datasets/movi-d-test-256x256.hdf5", "weight": 1.0, "split": false}
        ] 
  },
  "model": {
        "level": 2,
        "batch_size": 3,
        "num_objects": 16,
        "img_channels": 3,
        "input_depth": false,
        "input_size": [256,  256], 
        "crop_size": [256,  256],
        "latent_size": [16, 16], 
        "vae_factor": 1e-5,
        "object_permanence_strength": 1,
        "object_regularizer": 0,
        "position_regularizer": 1,
        "time_regularizer": 1,
        "disentanglement_regularizer": 0.3,
        "encoder_regularizer": 0.1,
        "supervision_factor": 0,
        "entity_pretraining_steps": 10000,
        "mixed_precision": false,
        "gradient_accumulation_steps": 1,
        "inference_mode": "regularization",
        "rgb_loss": "YCbCrL2SSIMLoss",
        "embedding": {
            "mask": { 
                "channels": 32,
                "expansion": 4
            },
            "depth": {
                "channels": 64,
                "expansion": 4
            },
            "rgb": {
                "channels": 128,
                "expansion": 4
            }
        },
        "position_proposal": {
            "channels": 64,
            "num_layers": 3
        },
        "encoder": {
            "hyper": true,
            "channels": 32,
            "blocks": [1,1,3,2],
            "hyper_channels": 256,
            "level1_channels": 32,
            "gestalt_size": 256,
            "bottleneck": "binar",
            "gestalt_frozzen": true
        },
        "predictor": {
            "heads": 1,
            "layers": 3,
            "channels": 1024,
            "reg_lambda": 1e-8,
            "gestalt_size": 256,
            "bottleneck": "binar",
            "gate": {
                "num_layers": 3,
                "num_hidden": 256,
                "reg_lambda": 1e-5,
                "noise_level": 0.1
            }
        },
        "decoder": {
            "mask": {
                "pretrain_encoder_blocks": [2,4],
                "pretrain_encoder_channels": 256
            },
            "depth": {
                "layers": 3,
                "pretrain_encoder_blocks": [2,4],
                "pretrain_encoder_channels": 256
            },
            "rgb": {
                "layers": 5,
                "pretrain_encoder_blocks": [4,8],
                "pretrain_encoder_channels": 256
            }
        },
        "background": {
            "supervision_factor": 0.1,
            "depth_weighting": false,
            "uncertainty_threshold": 0.1,
            "gan_loss_pretraining": 50000000,
            "uncertainty_warmup_steps": 3000,
            "depth_pretraining_steps":  10000,
            "gan_loss_factor": 0.5,
            "masking_ratio": 0.75,
            "uncertainty_noise_ratio": 0.1,
            "motion_context_size": 256,
            "depth_context_size": 256,
            "latent_channels": 64,
            "num_layers": 2
        }
    }
}                          
