# Configs composed together with this file.
# NOTE(review): looks like a Hydra-style defaults list that pulls in
# `base_dataset`; which side wins on conflicting keys depends on the loader's
# merge order — confirm before relying on an override.
defaults:
  - base_dataset

# Environment layout and simulation parameters.
# NOTE(review): units and exact semantics are defined by the consuming
# environment code, which is not visible here — the notes below are
# assumptions to confirm.

# NOTE(review): presumably the side length of a square grid; the positions
# below stay within 0..4, which is consistent with a size of 5 — confirm.
grid_size: 5
# Start and goal positions, each a two-element pair.
# NOTE(review): presumably the i-th start is paired with the i-th goal
# (opposite corners) — verify against the environment.
start_positions:
  - [0, 0]
  - [4, 0]
goal_positions:
  - [4, 4]
  - [0, 4]
noise_scale: 0.12
n_simulation_steps: 12
# NOTE(review): Kp / Kd look like proportional / derivative controller
# gains — confirm. Key casing is kept as-is because consumers read these names.
Kp: 1.0
Kd: 0.3
episode_len: 50
action_dim: 2
# Not a literal value: the `${...}` reference is left for the config loader
# to resolve.
# NOTE(review): looks like an OmegaConf/Hydra interpolation of the
# `algorithm.repeat_observation` key in the composed config — confirm.
repeat_observation: ${algorithm.repeat_observation}

# Environment identifier and precomputed statistics.
env_id: 'diagonal2d-v0'
# NOTE(review): presumably the reward discount factor (1.0 would mean
# undiscounted) — confirm with the consumer.
gamma: 1.0
# Mean / standard-deviation values for observations, actions and rewards.
# NOTE(review): presumably used to normalize dataset samples, with one list
# entry per observation/action dimension (two each, matching `action_dim: 2`
# in this file) — confirm. Regenerate these if the underlying data changes.
observation_mean: [1.9999, 2.0151]
observation_std: [1.1742, 1.1665]
action_mean: [-0.0048, 0.0797]
action_std: [0.1052, 0.0684]
reward_mean: 0.0402
reward_std: 0.1964
