# Settings for a policy-evaluation run. This summary is inferred from the key
# names below; the code that consumes this file is not visible here.
# NOTE(review): `???` parses as the plain string "???". It looks like the
# OmegaConf/Hydra mandatory-value marker, i.e. a value that must be supplied
# from outside this file (for example by an override). Confirm that the
# loader treats it that way.
# NOTE(review): the value below is presumably a Gym-style registered
# environment ID; confirm against the environment registration code.
env_name: CustomReacherEnv-v0
# Names of the rewards this configuration refers to (two entries).
rewards:
  - ground_truth
  - ground_truth_shaping
policy:
  # Placeholders: neither the checkpoint path nor the policy config path is
  # set in this file.
  checkpoint_filepath: ???
  config_filepath: ???
policy_evaluation:
  # Placeholder: the training-step count is not set in this file.
  num_training_steps: ???
  # One million (1,000,000); parsed as an integer.
  num_evaluation_steps: 1000000
# Placeholder: the output directory is not set in this file.
output_dir: ???
