# Hydra defaults list. `_self_` is listed last, so keys set in this file take
# precedence over those pulled in from the `qd: cma_mae` option.
defaults:
  - qd: cma_mae
  - _self_

# Dotted path of the class this config node is instantiated as.
_target_: src.algorithms.AURORA

# Agent settings; `_target_` names the class to build.
agent:
  # Alternative implementation: src.agents.MLPAgent
  _target_: src.agents.ToeplitzAgent
  # Hidden layer sizes
  layers:
    - 128
    - 128
  activation: 'tanh'
  # Both dimensions are interpolated from the `env` config node.
  state_dim: '${env.state_dim}'
  action_dim: '${env.action_dim}'

# Trajectory encoder settings; `_target_` names the class to build.
encoder:
  _target_: src.embeddings.TrajectoryEncoder
  # Taken from the top-level `device` key.
  device: '${device}'
  # Same `env.state_dim` value the agent block reads.
  state_dim: '${env.state_dim}'
  # Dimension of measures. The absolute interpolation path assumes this file
  # is composed under the `algorithm` key -- TODO confirm.
  latent_dim: '${algorithm.measures_dim}'
  hidden_dim: 32
  num_layers: 1
  teacher_force: true

# Encoder training parameters
encoder_training:
  batch_size: 64
  epochs: 50
  # Written with an explicit mantissa dot: YAML 1.1 resolvers (e.g. stock
  # PyYAML) read a bare `1e-3` as the string "1e-3" rather than a float.
  learning_rate: 1.0e-3
  # NOTE(review): presumably the fraction of data held out for validation
  # -- confirm against the training code.
  validation_split: 0.2
  # NOTE(review): presumably the early-stopping patience in epochs -- confirm.
  patience: 10

use_lstm: true
# Also read by `encoder.latent_dim` through `${algorithm.measures_dim}`.
measures_dim: 4
# Margin for archive ranges
measure_margin: 0.1
# Following QDAX implementation
traj_sampling_freq: 10
total_iterations: 500
# Encoder update schedule
update_interval:
  - 20
  - 50
  - 100
  - 200
  - 300
# Evaluations per solution
n_evals: 5