# Configuration for a small grid-world environment.
# `_target_` names the class this mapping is meant to construct (Hydra-style
# instantiate convention); the remaining keys are passed through as-is.
# NOTE(review): coordinate pairs below are presumably [row, col] indices into
# a num_rows x num_cols grid -- confirm against env.GridWorld.
_target_: env.GridWorld

# Grid dimensions.
num_rows: 3
num_cols: 7

# State sets, each written as a list of coordinate pairs.
start_state: [[1, 3]]
goal_states: [[1, 0], [1, 6]]
# `null` (not the plain scalar `None`, which YAML loads as the string "None")
# so that the consumer receives an actual null / Python None.
restart_states: null
obstructed_states: [[1, 1], [1, 5]]
bad_states: null

# Dynamics parameters.
# NOTE(review): gamma is presumably the discount factor, and
# p_good_transition / transition_bias presumably control stochastic
# movement -- exact semantics live in env.GridWorld; confirm there.
gamma: 0.9
p_good_transition: 0.7
transition_bias: 0.5

# Reward values.
step_reward: 0.0
goal_reward: 0.1
bad_state_reward: 0.0
restart_state_reward: 0.0
