# @package _global_
# Environment family label for this run.
# NOTE(review): how this key relates to the `/envs/dqn` entry selected in the
# defaults list is not visible in this file — confirm against the consumer.
env_type: atari

# Hydra defaults list: the base configs composed into this run.
# The environment config is taken from the `envs/dqn` group (here: `atari`).
# NOTE(review): this comment previously advertised `env=atari|minigrid|procgen`,
# but no `env` group appears in the list — presumably the command-line
# override is `envs/dqn=<name>`; confirm which options exist in that group.
defaults:
  - /experiment: default
  - /value_fn: default
  - /optimizer: default
  - /envs/dqn: atari
  # `_self_` comes last, so the values set in this file take precedence over
  # the configs composed above.
  - _self_

# Overrides applied on top of the `experiment` config from the defaults list.
experiment:
  num_threads: 1
  gpu: 0
  # NOTE(review): `your-entity` looks like a placeholder; with `track: true`
  # below it presumably needs to be replaced by a real W&B entity — confirm.
  wandb_entity: your-entity
  wandb_project_name: "Hyperbolic RL - Atari Paper"
  tag: hyper-srym
  track: true

# Env settings
# Environment id and the overall training budget for this run.
# NOTE(review): whether total_timesteps counts agent steps or emulator frames
# is not visible here — confirm against the training loop.
env_id: BreakoutNoFrameskip-v4
total_timesteps: 10000000

# Optimizer settings
# Overrides applied on top of the `optimizer` config from the defaults list.
optimizer:
  algorithm: adam
  # Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
  # only resolve exponent notation as a float when the dot is present and
  # would otherwise load `1e-4` as the string "1e-4". Same numeric value.
  learning_rate: 1.0e-4
  adams_eps: 2.5e-5

# Q-overrides
# Overrides applied on top of the `value_fn` config from the defaults list.
value_fn:
  # Geometry settings for the value function.
  # NOTE(review): presumably a Poincaré-ball model; the sign convention for
  # `curvature` is not visible here — confirm in the consumer.
  curvature: 1.0
  manifold: poincare
  # NOTE(review): `sn` presumably stands for spectral normalization — confirm.
  regularization: sn
  feature_scaling: dim
  forward_pass: HRL_forward
  small_weights: false
  manifold_dtype: float32
  manifold_params_dtype: float32
  # Value loss parameters
  # NOTE(review): the bin count and min/max range presumably only matter for
  # a binned/categorical loss and are unused with `mse` — confirm.
  loss_fn: mse
  loss_num_bins: 51
  loss_min_value: -10.0
  loss_max_value: 10.0

# DDQN settings
# Top-level agent hyperparameters (set at the global package level).
embedding_dim: 512
last_layer_tanh: false
batch_size: 32
buffer_size: 1000000
learning_starts: 80000
train_frequency: 4
# NOTE(review): with tau at 1.0 the target update is presumably a full copy
# every `target_network_frequency` steps — confirm against the training loop.
target_network_frequency: 1000
tau: 1.0
gamma: 0.99
# Exploration schedule endpoints.
# NOTE(review): presumably epsilon is annealed from start_e to end_e over
# exploration_fraction * total_timesteps — confirm.
start_e: 1.0
end_e: 0.01
exploration_fraction: 0.10

# Logging / diagnostics switches.
encoder_log_frequency: 100000
compute_embedding_metrics: false
