{
  "IS": false,
  "cost": {
    "clamp_magnitude": 10,
    "gradient_step": 1,
    "hid_act": "relu",
    "hidden_sizes": [
      64,
      64
    ],
    "lr": 0.0001,
    "momentum": 0.9,
    "residual": false,
    "use_bn": false,
    "weight_decay": 0.001
  },
  "critic": {
    "batch_size": 800,
    "hid_act": "tanh",
    "hid_dim": 128,
    "iter": 1200,
    "lam": 0.5,
    "lr": 0.0003,
    "model_type": "resnet_disc",
    "momentum": 0.0,
    "num_layer_blocks": 3,
    "use_bn": false,
    "weight_decay": 0.0001
  },
  "cuda": -1,
  "disc": {
    "batch_size": 800,
    "clamp_magnitude": 10.0,
    "hid_act": "tanh",
    "hid_dim": 128,
    "iter": 1200,
    "lr": 0.0003,
    "model_type": "resnet_disc",
    "momentum": 0.9,
    "num_layer_blocks": 3,
    "reinit": false,
    "use_bn": false,
    "weight_decay": 0.0001
  },
  "env": {
    "T": 1000,
    "env_name": "Walker2d-v3",
    "state_indices": "all"
  },
  "experiment_tag": 32,
  "irl": {
    "eval_episodes": 20,
    "expert_episodes": 1,
    "n_itrs": 600,
    "resample_episodes": 1,
    "save_interval": 0,
    "training_trajs": 10
  },
  "obj": "maxentirl_sa",
  "reward": {
    "clamp_magnitude": 10,
    "gradient_step": 1,
    "hid_act": "relu",
    "hidden_sizes": [
      64,
      64
    ],
    "lr": 0.0001,
    "momentum": 0.9,
    "residual": false,
    "use_bn": false,
    "weight_decay": 0.001
  },
  "sac": {
    "alpha": 0.2,
    "automatic_alpha_tuning": false,
    "batch_size": 100,
    "buffer_size": 1000000,
    "epochs": 5,
    "k": 1,
    "log_step_interval": 5000,
    "lr": 0.001,
    "num_test_episodes": 10,
    "random_explore_episodes": 1,
    "reinitialize": false,
    "update_every": 1,
    "update_num": 1
  },
  "seed": 23
}