# Logging / evaluation options.
# NOTE(review): the per-key notes below are inferred from key names only;
# confirm them against the code that consumes this file.

# Canonical lowercase boolean, consistent with `log_weights` below.
progress_bar: true
log_weights: false
# presumably a logging period; the unit is not visible here — TODO confirm
log_interval: 512
optim_steps_per_batch: 1
num_eval_rollouts: 1
# Explicit null: no value is configured here.
include_additional_keys: null
# Each entry uses `${name:args}` interpolation syntax. `as_tuple` is not
# defined in this file — presumably a resolver registered by the loading
# code (OmegaConf-style); verify it is registered before this file is resolved.
eval_metrics:
  - ${as_tuple:"reward","mean"}
  - ${as_tuple:"reward","sum"}