{                                                                                                     
  "model_path": "kitti_256_bg",
  "datatype": "kitti-simple",                                                                         
  "dataset": "kitti_256-v3",                                                                         
  "frame_skip": 2,
  "num_workers": 8,
  "prefetch_factor": 1,
  "learning_rate": 0.0001, 
  "sequence_len": 30, 
  "backprop_steps": 3,
  "update_interval": 1,
  "epochs": 1000,                                                                                   
  "updates": 50000000,
  "closed_loop": false,
  "teacher_forcing": 0,                                                                              
  "statistics_offset": 0,                                                                              
  "msssim": false,
  "load_optimizers": false,
  "scheduled_sampling": false,
  "trainig_mode": "background_depth",
  "model": {
        "level": 2,
        "batch_size": 32,
        "num_objects": 10,
        "img_channels": 3,
        "input_size": [256,  832], 
        "latent_size": [16, 52], 
        "vae_factor": 1e-5,
        "object_permanence_strength": 1,
        "object_regularizer": 1,
        "position_regularizer": 1,
        "time_regularizer": 1,
        "warmup_regularizer": 100,
        "unmasked_regularizer": 0.1,
        "encoder_regularizer": 0.1,
        "supervision_factor": 0,
        "entity_pretraining_steps": 3000000,
        "pretraining_steps": 0,
        "uncertainty_warmup_steps": 250000,
        "rgb_loss_factor": 0.01,
        "depth_weighting": true,
        "gan_loss_pretraining": 500000,
        "gan_loss_factor": 0.5,
        "encoder": {
            "channels": 64,
            "level1_channels": 32,
            "num_layers": 3,
            "gestalt_size": 128,
            "bottleneck": "binar"
        },
        "predictor": {
            "heads": 2,
            "layers": 2,
            "channels_multiplier": 2,
            "reg_lambda": 1e-10,
            "gestalt_size": 128,
            "bottleneck": "binar"
        },
        "decoder": {
            "channels": 32,
            "num_layers": 2
        },
        "background": {
            "learning_rate": 0.0001, 
            "num_layers": 3, 
            "reg_lambda": 1e-10,
            "num_embedding_layers": 0,
            "num_attention_layers": 3,
            "num_hyper_layers": 3,
            "num_hyper_channels": 96,
            "num_heads": 3,
            "uncertainty_base_channels": 16,
            "uncertainty_blocks": [1,2,3,4],
            "uncertainty_threshold": 0.1,
            "uncertainty_regularizer": 0.05,
            "depth_input": true,
            "channels": 48,
            "use": true
        }
    }
}                          
