# Hypergrid environment configuration

# Base Hypergrid environment settings.
environment:
  name: "hypergrid"
  type: "HypergridEnvironment"

  # Hypergrid parameters
  height: 30
  ndim: 5
  reward_beta: 10.0
  # Keep the explicit ".0" in the mantissa: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `1e-5` to the string "1e-5" instead of a float.
  reward_at_corners: 1.0e-5

  # State and action dimensions (derived from ndim; keep in sync with it)
  state_dim: 5 # Same as ndim
  action_dim: 11 # 2 * ndim + 1 (movement actions + terminate)

# Difficulty levels for scalability experiments (RQ6).
# Each level sets height and ndim together with the matching derived
# dimensions: state_dim = ndim and action_dim = 2 * ndim + 1.
# NOTE(review): how a level is applied on top of `environment` is decided by
# the consuming code, which is not visible in this file.
difficulty_levels:
  # 3-dimensional grid, height 10
  easy:
    height: 10
    ndim: 3
    state_dim: 3
    action_dim: 7

  # 4-dimensional grid, height 20
  medium:
    height: 20
    ndim: 4
    state_dim: 4
    action_dim: 9

  # 5-dimensional grid, height 30 (same values as the `environment` block)
  hard:
    height: 30
    ndim: 5
    state_dim: 5
    action_dim: 11

# Evaluation metrics specific to Hypergrid
# NOTE(review): the exact semantics and units of these values are defined by
# the consuming code, which is not visible in this file — confirm before
# changing them.
metrics:
  target_l1_error: 0.1
  target_mode_coverage: 0.95 # presumably a fraction in [0, 1] — TODO confirm
  convergence_patience: 500 # unit (steps/iterations/evals) — TODO confirm
