# Directory settings. Every value is a relative path (leading "./") that
# ends with a trailing "/".
# NOTE(review): what each directory holds is only implied by its key name;
# confirm against the code that reads this file.
experiments_path: "./experiments/"
preds_path: "./nn_preds/"
env_path: "./envs/"
env_mask_path: "./env_masks/"
policy_folder: "./models/"
action_logs: "./action_logs/"
#########################
# NOTE(review): units of goal_tolerance and timeout_per_option are not
# stated in this file - confirm with the consumer.
goal_tolerance: 0.2
n_xy_bins: 224
# NOTE(review): 1120 = 5 x 224, the same factor by which the commented-out
# 25m-env limits (12.5) exceed the active ones (2.5); presumably the two are
# meant to be switched together - confirm.
# n_xy_bins: 1120
n_dof_bins: 10
timeout_per_option: 10
# Quoted so it is loaded as the string "8" rather than the integer 8.
env_name: "8"
robot:
  # Active robot model. Only one name/model_path pair may be uncommented
  # at a time, since a mapping cannot contain duplicate keys.
  name: "slab"
  model_path: "simple_robot.urdf"

  # Alternative robots:
  # name: "turtlebot"
  # model_path: "turtlebot3_burger.urdf"
  # name: "husky"
  # model_path: "husky/husky.urdf"
  # name: "hinged"
  # model_path: "hinged_robot.urdf"

  # llimits / ulimits each hold ndofs entries (lower and upper bounds).
  # NOTE(review): presumably ordered x, y, yaw - confirm with the consumer.
  ndofs: 3
  llimits: [-2.5, -2.5, -3.14]
  ulimits: [2.5, 2.5, 3.14]

  # Use this for larger 25m envs

  # ndofs: 3
  # llimits: [-12.5, -12.5, -3.14]
  # ulimits: [12.5, 12.5, 3.14]

mp_robot:
  # Use simple_puck_big.urdf if the robot model is anything other than
  # simple_robot.urdf.
  name: "slab"
  model_path: "simple_puck.urdf"
  # model_path: "simple_puck_big.urdf"

  # llimits / ulimits each hold ndofs entries (lower and upper bounds).
  ndofs: 2
  llimits: [-2.5, -2.5]
  ulimits: [2.5, 2.5]

  # Use this for larger 25m envs

  # ndofs: 2
  # llimits: [-12.5, -12.5]
  # ulimits: [12.5, 12.5]


# Top-level evaluation and debugging switches.
# Booleans use the canonical lowercase form (true/false), which loads as a
# boolean under both YAML 1.1 and the YAML 1.2 core schema.
num_test_problems: 30
trainer_gui: false
simulator_gui: false
debug: false
eval_action_limit: 100
# NOTE(review): region_policy and point_policy each define their own
# eval_time_limit as well; confirm which one the consumer actually reads.
eval_time_limit: 100
eval_threshold: 0.71
visualize_policy: false
reset: false

# Training settings for the region policy.
region_policy:
  train_envs: 10
  warm_starts: 1000
  max_ep_len: 150
  update_batch: 150
  train_timesteps: 500000
  batch_size: 128
  train_freq: 10
  buffer_size: 1000000
  # NOTE(review): a top-level eval_time_limit with the same value also
  # exists; confirm which one takes precedence.
  eval_time_limit: 100
  # Evaluation happens every train_envs * eval_freq steps
  # (with the values here: 10 * 1600 = 16000 steps).
  # Set eval_freq accordingly.
  eval_freq: 1600

# Training settings for the point policy.
point_policy:
  train_envs: 10
  warm_starts: 1000
  max_ep_len: 150
  update_batch: 150
  train_timesteps: 160000
  batch_size: 128
  train_freq: 10
  buffer_size: 1000000
  # NOTE(review): a top-level eval_time_limit with the same value also
  # exists; confirm which one takes precedence.
  eval_time_limit: 100
  # Evaluation happens every train_envs * eval_freq steps
  # (with the values here: 10 * 1600 = 16000 steps).
  # Set eval_freq accordingly.
  eval_freq: 1600

# Beam search parameters.
# NOTE(review): the meaning of n and k is not documented in this file;
# confirm against the search code before tuning.
beam_search:
  n: 40
  k: 100

# Settings for HARP.
# NOTE(review): timeout units are not stated here (presumably seconds) -
# confirm with the consumer.
HARP:
  timeout: 30
