{
  "exp": "improv_radac_1",
  "device": "cuda:1",
  "env_name": "hopper-medium-expert-v2",
  "dir": "results",
  "seed": 0,
  "risky_dataset_path": "risky_d4rl/hopper_medium_expert.hdf5",
  "eval_risky_env": true,
  "use_cvar": false,
  "alpha_override": null,
  "batch_size": 256,
  "lr_decay": false,
  "early_stop": true,
  "save_best_model": true,
  "record_tensorboard": false,
  "discount": 0.99,
  "T": 5,
  "beta_schedule": "vp",
  "algo": "radac",
  "ms": "offline",
  "save_model": true,
  "output_dir": "results",
  "num_epochs": 2000,
  "eval_freq": 50,
  "eval_episodes": 10,
  "lr_actor": 0.0003,
  "lr_critic": 1e-05,
  "eta": 0.05,
  "gn": 5.0,
  "top_k": 0,
  "tau": 0.005,
  "emb_dim": 64,
  "n_quantiles": 16,
  "max_q_backup": false,
  "q_clip_range": [
    -300.0,
    300.0
  ],
  "lambda_bc": 1.0,
  "eta_warmup_steps": 300000,
  "eta_ramp_steps": 0,
  "max_vel": 2.0,
  "prob_vel_penal": 0.0,
  "cost_vel": -0.0,
  "risk_prob": 0.0,
  "risk_penalty": 0.0,
  "prob_pose_penal": 0.1,
  "cost_pose": -50.0,
  "healthy_angle_range": [
    -0.17,
    0.04
  ],
  "done_if_exceed_factor": 100.0,
  "alpha": 0.1,
  "start_steps": 1000,
  "num_steps_per_epoch": 1000,
  "flow_steps": 10,
  "version": "DDAC-vs-RADAC",
  "state_dim": 11,
  "action_dim": 3,
  "max_action": 1.0
}