# Hydra defaults list: the entries are composed in the order they appear.
defaults:
  # Select the `experiment` option of the `hydra` config group.
  - hydra: experiment
  # `_self_` comes last, so the values in this file are merged after
  # (and take precedence over) the entries listed above.
  - _self_

# Name of this configuration.
name: 'guarantees'
# Run label; it is substituted for ${run} in results.dir.
run: 'main'

# Environment selection; env.name is interpolated into results.dir.
env:
  name: 'simple_grid'

# Location of the episode-return results.
results:
  # Directory path assembled from env.name and run through interpolation.
  # NOTE(review): presumably relative to the working directory — confirm.
  dir: '../${env.name}/eval/${run}'
  # File name of the Parquet file holding the episode returns.
  results_file: 'episode_returns.parquet'

# Settings for the guarantee computation.
guarantees:
  # Bound to use. Options: hoeffding, bernstein, dkw, clopper-pearson
  bound: clopper-pearson
  # Lower and upper end of the return range.
  # NOTE(review): presumably the support assumed by the bound — confirm.
  min_return: 0.0
  max_return: 1.0
  # Lists of task counts and episode counts.
  # NOTE(review): presumably each listed value is evaluated in turn — confirm.
  num_tasks: [100]
  num_episodes: [100, 200, 300, 400, 500, 600, 700, 800, 900, 1000]
  # The two floats below are written with an explicit decimal point in the
  # mantissa: a bare `1e-4` is read as a *string* by YAML 1.1 loaders such
  # as plain PyYAML, whereas `1.0e-4` is a float everywhere.
  # NOTE(review): values this small read like failure probabilities
  # (confidence = 1 - value) rather than confidence levels — confirm.
  beta: 1.0e-4  # confidence level for individual lower bounds
  delta: 1.0e-2  # desired overall confidence level
  # NOTE(review): meaning of step_size is not visible from this file — confirm.
  step_size: 1

# Number of parallel jobs.
n_jobs: 8
