# Hydra defaults list. `_self_` is listed first, so this file's own values are
# composed first and the entries after it (here the `env` group, option
# `atari`) are merged on top of them.
defaults:
  - _self_
  - env: atari

# Hydra runtime settings.
hydra:
  job:
    # Change the working directory to Hydra's per-run output directory.
    chdir: true

# Weights & Biases settings. Every field except `mode` is left null in this
# file.
# NOTE(review): the keys mirror `wandb.init` argument names and are presumably
# forwarded to it — confirm against the calling code.
wandb:
  mode: online
  project: null
  entity: null
  name: null
  group: null
  tags: null
  notes: null

# Checkpoint initialization. No checkpoint path is set by default.
# NOTE(review): `load_wm` / `load_ac` presumably select whether the world model
# and the actor-critic are restored from `path_to_ckpt` — confirm in the
# loading code.
initialization:
  path_to_ckpt: null
  load_wm: true
  load_ac: true

# Run-wide settings. `seed` is unset (null) by default.
common:
  device: cuda:0
  seed: null
  resume: false  # do not modify, set by scripts/resume.sh only.

# Data collection settings, split into a `train` and a `test` section.
# NOTE(review): `train.stop_after_epochs` (1000) is lower than
# `training.epochs` (1500), so collection presumably stops before training
# ends — confirm this is intended.
# NOTE(review): `epsilon` looks like an epsilon-greedy exploration rate
# (0.0 for test would mean no random actions) — confirm in the collector.
collection:
  path_to_static_dataset: null
  train:
    num_envs: 1
    stop_after_epochs: 1000
    config:
      num_steps_first_epoch: 100
      num_steps: 100
      epsilon: 0.01
  test:
    num_envs: 4
    config:
      num_episodes: 1
      epsilon: 0.0

# Training settings: top-level switches followed by one sub-section per
# trained component (`denoiser`, `rew_end`, `actor_critic`).
#
# Floats in scientific notation are written with an explicit decimal point
# (`1.0e-4`, not `1e-4`) so that every YAML loader reads them as floats; plain
# YAML 1.1 loaders such as PyYAML treat `1e-4` as a string.
training:
  should: true
  epochs: 1500
  save_agent_every: 10  # use -1 to save last epoch only
  cache_in_ram: false
  model_free: false  # if True, turn off world_model training and RL in imagination

  # NOTE(review): `epsilon` in the sub-sections below sits next to
  # `learning_rate` / `weight_decay` and is presumably the optimizer's
  # numerical-stability term, not an exploration rate — confirm.
  denoiser:
    start_after_epochs: 0
    steps_first_epoch: 2000
    steps_per_epoch: 300
    batch_size: 32
    learning_rate: 1.0e-4
    weight_decay: 1.0e-2
    epsilon: 1.0e-8
    lr_warmup_steps: 500
    max_grad_norm: 1.0
    grad_acc_steps: 1

  # Same schedule and optimizer values as `denoiser`.
  rew_end:
    start_after_epochs: 0
    steps_first_epoch: 2000
    steps_per_epoch: 300
    batch_size: 32
    learning_rate: 1.0e-4
    weight_decay: 1.0e-2
    epsilon: 1.0e-8
    lr_warmup_steps: 500
    max_grad_norm: 1.0
    grad_acc_steps: 1

  # Same schedule and optimizer values as above, plus RL-specific settings.
  # NOTE(review): `gamma` / `lambda_` look like the discount factor and the
  # lambda-return coefficient — confirm in the actor-critic loss.
  actor_critic:
    imagination_horizon: 20
    num_steps: 20
    batch_size: 32
    grad_acc_steps: 1
    start_after_epochs: 0
    steps_first_epoch: 2000
    steps_per_epoch: 300
    learning_rate: 1.0e-4
    weight_decay: 1.0e-2
    epsilon: 1.0e-8
    lr_warmup_steps: 500
    max_grad_norm: 1.0
    gamma: 0.997
    lambda_: 0.95
    entropy_weight: 0.001

# Evaluation settings.
# NOTE(review): `every` is presumably the evaluation period in epochs —
# confirm in the training loop.
evaluation:
  should: true
  every: 1

############################################################################
############################### MODELS #####################################
############################################################################

# World model configuration. `_target_` is the key `hydra.utils.instantiate`
# uses to locate the class to build (`models.diffuser.WorldModelConfig`).
# NOTE(review): `num_actions` is null here and is presumably filled in at
# runtime from the environment — confirm.
world_model:
  _target_: models.diffuser.WorldModelConfig
  image_size: 64
  image_channels: 3
  num_actions: null
  num_steps_conditioning: 4
  sigma_data: 0.5
  sigma_offset_noise: 0.3

##################################################################################
##################################################################################
##################################################################################
