# Training parameters
# Written without digit separators: `2_000_000` is an integer only under
# YAML 1.1 resolvers; a YAML 1.2 core-schema loader reads it as a string.
total_timesteps: 2000000
learning_rate: 3.0e-4
num_envs: 1
num_steps: 2048
env_id: "Hopper-v5"
# NOTE(review): integer used where a flag seems intended, while `exp`
# further down is a real boolean — confirm what the consumer expects.
mujoco: 1
n_eval: 100

seeds:
  - 1
  - 2
  - 3

# Everything below in this section is commented out, so the parser
# ignores it; the lines are kept only for reference.
# num_minibatches: 4
# update_epochs: 4

# # PPO hyperparameters
# clip_coef: 0.2
# ent_coef: 0.01
# vf_coef: 0.5
# max_grad_norm: 0.5
# target_kl: null
# norm_adv: true
# clip_vloss: true

# Attack parameters - Daze
dazer: "simplex"
num_daze: 8

# Attack parameters - Inception
n_updates: 512
# NOTE(review): the only key visible here that is not lower_snake_case;
# the spelling must stay in sync with whatever the consumer looks up.
True_Bound: 0
# NOTE(review): -1 looks like a sentinel value — confirm its meaning.
start_poisoning: -1
# buffer_size: 500000
batch_incept: 256

# Attack parameters - SleeperNets
alpha: 1

# Attack parameters - TrojDRL
strong: 0

# Attack parameters - General
robust: 0
# NOTE(review): presumably the poisoning rates to sweep — confirm.
p_rates: [0.01, 0.005, 0.0025, 0.02]

exp: false
dist_type: "nll"

# SN/TrojDRL
rew_p: 5
clip: 0

# Attack flags
# Every flag in this group is currently set to 0.
# NOTE(review): presumably 0 = off and 1 = on — confirm with the consumer
# before switching these to real booleans.
sn_outer: 0
daze: 0
inception: 0
trojdrl: 0
badrl: 0
badbots: 0
learned: 0

# Target action
# Three entries are active; the four commented-out lines below are
# ignored by the parser.
# NOTE(review): presumably one entry per action dimension of `env_id` —
# re-check the count whenever the environment changes.
target_action:
  - -1.0
  - -1.0
  - -1.0
  # - -1.0
  # - -1.0
  # - -1.0
  # - -1.0

# Logging
wandb_project_name: "hopper-daze"
exp_name: "init"
# The two keys below are commented out, so the parser ignores them.
# unique_id: 1753158812
# track: 1
