# Filesystem locations, all written as relative paths.
# NOTE(review): what each directory holds is inferred from the key names only;
# confirm against the code that reads this file. The values are not uniform
# (experiments_path has no trailing slash, results_folder has no "./" prefix),
# so check how the consumer joins paths before normalising them.
experiments_path: "./experiments"
preds_path: "./nn_preds/"
env_path: "./envs/"
env_mask_path: "./env_masks/"
policy_folder: "./models/"
action_logs: "./action_logs/"
policy_logs: "./policy_logs/"
results_folder: "results/"
#########################
# Global scalar settings. Units are not stated anywhere in this file.
# NOTE(review): presumably distances share the unit of the robot limits below
# and timeouts are in seconds - confirm against the consumer.
goal_tolerance: 0.2
n_xy_bins: 224
# Alternative value kept for reference (1120 = 5 x 224):
# n_xy_bins: 1120
n_dof_bins: 10
timeout_per_option: 10
criticality_threshold: 0.6
# Quoted so the value stays a string even though it starts with a digit.
env_name: "8_small"
# Robot description. Exactly one name/model_path pair and one
# ndofs/llimits/ulimits set is active; the commented-out groups are
# alternatives that are swapped in by hand.
# Active selection: "limo" with 3 DOFs.
robot:
  # name: "slab"
  # model_path: "simple_robot.urdf"

  # name: "turtlebot"
  # model_path: "turtlebot3_burger.urdf"
  # name: "husky"
  # model_path: "husky/husky.urdf"

  name: "limo"
  model_path: "limo/limo.urdf"


  # name: "hinged"
  # model_path: "hinged_robot.urdf"
  # ndofs: 3
  # llimits:
  #   - -7.5
  #   - -7.5
  #   - -3.14
  # ulimits:
  #   - 7.5
  #   - 7.5
  #   - 3.14

  # Active limits: llimits and ulimits each carry one entry per DOF
  # (3 entries for ndofs: 3).
  # NOTE(review): the +/-3.14 bound suggests the third DOF is a heading in
  # radians and the first two are x/y - confirm.
  ndofs: 3
  llimits:
    - -2.5
    - -2.5
    - -3.14
  ulimits:
    - 2.5
    - 2.5
    - 3.14


  # ndofs: 4
  # llimits:
  #   - -2.5
  #   - -2.5
  #   - -3.14
  #   - -1.57
  # ulimits:
  #   - 2.5
  #   - 2.5
  #   - 3.14
  #   - 1.57
  # ndofs: 3
  # llimits:
  #   - -12.5
  #   - -12.5
  #   - -3.14
  # ulimits:
  #   - 12.5
  #   - 12.5
  #   - 3.14

# Second robot description, using the same keys as `robot`.
# NOTE(review): "mp" presumably stands for motion planning (cf. mp_gui) -
# confirm. Its active limits (+/-7.5) are wider than the +/-2.5 used by
# `robot`; verify that this difference is intentional.
mp_robot:
  name: "slab"
  # model_path: "simple_puck.urdf"
  # model_path: "simple_robot.urdf"
  model_path: "simple_robot_small.urdf"


  # Active limits: one entry per DOF (3 entries for ndofs: 3).
  ndofs: 3
  llimits:
    - -7.5
    - -7.5
    - -3.14
  ulimits:
    - 7.5
    - 7.5
    - 3.14
  # ndofs: 2
  # llimits:
  #   - -12.5
  #   - -12.5
  # ulimits:
  #   - 12.5
  #   - 12.5

  # name: "hinged"
  # model_path: "hinged_robot.urdf"

  # ndofs: 4
  # llimits:
  #   - -2.5
  #   - -2.5
  #   - -3.14
  #   - -1.57
  # ulimits:
  #   - 2.5
  #   - 2.5
  #   - 3.14
  #   - 1.57

  
# LL control params
# Working config: 20 environments, 350000 train_timesteps, update_batch of 150.
# Scale the number of environments and train_timesteps together.
#
# Run-wide switches and evaluation limits.
# Booleans use the canonical lowercase true/false spelling, which every YAML
# schema resolves to a boolean (capitalised True/False is flagged by yamllint's
# `truthy` rule and is not a boolean under the YAML 1.2 JSON schema).
# NOTE(review): region_policy and point_policy each define their own
# eval_time_limit as well; which one takes precedence depends on the consumer.
num_test_problems: 5
trainer_gui: true
mp_gui: false
simulator_gui: false
debug: false
eval_action_limit: 100
eval_time_limit: 100
eval_threshold: 0.71
visualize_policy: false
reset: true

# Training settings for the region policy. Same keys as point_policy; the
# only value that differs between the two is train_freq (15 here, 10 there).
# NOTE(review): update_batch is -1 here, while the "Working config" comment
# earlier in the file mentions 150 - presumably -1 is a sentinel; confirm
# against the trainer.
region_policy:
  train_envs: 1
  warm_starts: 1000
  max_ep_len: 150
  update_batch: -1
  train_timesteps: 150000
  batch_size: 128
  train_freq: 15
  buffer_size: 1000000
  eval_time_limit: 100
  eval_freq: 1000

# Training settings for the point policy. Same keys as region_policy; the
# only value that differs between the two is train_freq (10 here, 15 there).
# NOTE(review): update_batch is -1 - presumably a sentinel; confirm against
# the trainer.
point_policy:
  train_envs: 1
  warm_starts: 1000
  max_ep_len: 150
  update_batch: -1
  train_timesteps: 150000
  batch_size: 128
  train_freq: 10
  buffer_size: 1000000
  eval_time_limit: 100
  eval_freq: 1000

# Beam-search parameters.
# NOTE(review): the meaning of n and k is not defined in this file (beam
# width vs. number of expansions is a guess) - confirm against the consumer.
beam_search:
  n: 40
  k: 100

# Settings for the HARP component.
# NOTE(review): the timeout unit is not stated - presumably seconds; confirm.
# The upper-case key differs from the snake_case keys used elsewhere, but
# renaming it would break whatever reads this section.
HARP:
  timeout: 30
