# Experiment-level settings.
# NUM_SEEDS / SEED: seed count and base seed (inferred from the key names;
# confirm against the training script).
NUM_SEEDS: 1
SEED: 0
# Weights & Biases settings (inferred from the WANDB_ prefix and the
# placeholder below; verify against the consumer).
WANDB_MODE: "online"
# Placeholder value -- replace with a real entity before running.
ENTITY: "your_wandb_entity"
PROJECT: "iclr_2026_emb_lambda"
# NOTE(review): only WANDB_LOG_ALL_SEEDS is nested under `alg`; every key
# after it sits at the top level. Confirm this nesting is what the loader
# expects.
alg:
  WANDB_LOG_ALL_SEEDS: false
# Output location and algorithm identifier (both plain strings).
# SAVE_PATH is a relative path; presumably where models are written --
# confirm in the consumer.
SAVE_PATH: "./models"
ALG_NAME: "emb_lambda"
# Training hyperparameters. Meanings noted below are inferred from the key
# names; confirm against the training script.

# Exponent floats are written as `5.0e+7` (mantissa dot + signed exponent):
# YAML 1.1 loaders such as PyYAML resolve a bare `5e7` as the string "5e7".
TOTAL_TIMESTEPS: 5.0e+7
# Same value as TOTAL_TIMESTEPS in this config.
TOTAL_TIMESTEPS_DECAY: 5.0e+7
NUM_ENVS: 128
NUM_STEPS: 32
# Presumably an epsilon-greedy exploration schedule -- TODO confirm.
EPS_START: 1.0
EPS_FINISH: 0.001
EPS_DECAY: 0.1
NUM_EPOCHS: 2
NUM_MINIBATCHES: 32
NORM_TYPE: "layer_norm"
LR: 0.00025
MAX_GRAD_NORM: 10
LR_LINEAR_DECAY: false
GAMMA: 0.99
LAMBDA: 0.4
# Equal to NUM_STEPS in this config.
MAX_BOOTSTRAP_STEPS: 32
# Environment selection. ENV_KWARGS is a nested mapping; presumably forwarded
# to the environment constructor -- confirm in the consumer.
ENV_NAME: "NameThisGame-v5"
ENV_KWARGS:
  episodic_life: true
  reward_clip: true
  repeat_action_probability: 0.0
  frame_skip: 4
  noop_max: 30
# Evaluation settings (inferred from the key names; verify against the
# consumer).
TEST_DURING_TRAINING: true
TEST_ENVS: 8
EPS_TEST: 0.0