# Training parameters
# NOTE(review): names look like PPO-style hyperparameters — confirm against
# the training script that consumes this file.
# total_timesteps is written without `_` digit separators: those are a
# YAML 1.1 extension, and a YAML 1.2 core-schema loader would read
# `2_000_000` as a string instead of an integer.
total_timesteps: 2000000  # 2 million
# Keep the decimal point and the signed exponent: PyYAML only resolves
# scientific notation as a float when both are present.
learning_rate: 2.0e-4
num_envs: 16
num_steps: 256
num_minibatches: 32
update_epochs: 10

# Environment identifier. Only one env_id key may be active at a time
# (duplicate keys are invalid YAML); the alternative below is commented out.
env_id: "fetch-v0"
#env_id: "traffic-stop-all-v0"

# Environment parameters
# NOTE(review): `real`, `edge` and `mujoco` hold 0/1 and look like integer
# on/off switches rather than YAML booleans — keep them as integers unless
# the consumer is confirmed to accept true/false.
# NOTE(review): units of ego_speed / tb2_speed are not stated here — confirm.
real: 1
ego_speed: 0.4
tb2_speed: 0.4
num_frames: 8
num_noise: 0
edge: 0
mujoco: 0

# Seed list: five integer entries, 1 through 5.
seeds: [1, 2, 3, 4, 5]


# General attack parameters (important!)
robust: 1
# p_rates is a list, currently holding the single value 0.01.
p_rates: [0.01]

# SleeperNets Parameters
# NOTE(review): meaning and valid range of alpha are not documented here —
# confirm in the attack code. It is written as the integer 1, not 1.0.
alpha: 1

# TrojDRL Parameters
# NOTE(review): 1 presumably selects the "strong" variant — confirm.
strong: 1

# TrojDRL + SleeperNets Parameters
# All three values are 0/1 integers.
# NOTE(review): True_Bound is the only capitalized key in the visible config;
# it is left unchanged because the consumer presumably looks it up by this
# exact name — confirm before renaming.
rew_p: 1
clip: 0
True_Bound: 0

# Daze Parameters
# NOTE(review): the set of accepted `dazer` names is not visible here —
# confirm in the attack code.
dazer: "simplex"
num_daze: 10
# NOTE(review): unit of start_poisoning (update, episode or timestep) is not
# stated here — confirm.
start_poisoning: 25

# Attack flags
# As configured, only sn_outer is set to 1; daze and trojdrl are set to 0.
# NOTE(review): whether more than one flag may be set at once is not visible
# here — confirm against the consumer.
sn_outer: 1
daze: 0
trojdrl: 0

# Target action: a two-element list of floats, both 1.0.
target_action: [1.0, 1.0]

# Logging
wandb_project_name: "daze-test"
exp_name: "init"
# The two keys below are commented out, so they are not loaded from this file.
#track: 0
#unique_id: 1757444662 # Filled at runtime, set for testing

# Deprecated parameters - keep them just in case!
# Note: `exp` is a YAML boolean (false), while the other switches in this
# stanza are 0/1 integers; the types are left exactly as they were.
exp: false
dist_type: "nll"
inception: 0
badrl: 0
badbots: 0
learned: 0