# Regular QD configuration (handcrafted measures).
_target_: src.algorithms.RegularQD

# Hydra defaults list. `_self_` is listed last, so values defined in this
# file take precedence over those pulled in from the `qd` group.
defaults:
  - qd: cma_mae
  - _self_

# Agent settings.
agent:
  # Alternative target: src.agents.MLPAgent
  _target_: src.agents.ToeplitzAgent
  # List of ints, possibly empty.
  layers:
    - 128
    - 128
  # Either 'relu' or 'tanh'.
  activation: 'tanh'
  # Both dimensions are interpolated from the `env` config node.
  state_dim: ${env.state_dim}
  action_dim: ${env.action_dim}

# List of strings; must match the names returned by the wrapper for each env.
# Left as null in this file.
measure_names: null

total_iterations: 500

# Number of trajectories used for policy evaluation
# (estimating return and embeddings).
n_evals: 5
