
# Hydra defaults list: swap the launcher for the submitit SLURM plugin.
defaults:
    - override /hydra/launcher: submitit_slurm

# ---------------------------------------------------------------------------
# Experiment identity
# ---------------------------------------------------------------------------
wandb_tag: expfinale_tests3

is_test: False
env: CartPole-v1
seed: 0

experiment_id: test
# Interpolated into the SLURM job name and the Hydra run/sweep directories.
experiment_id_new: test

# ---------------------------------------------------------------------------
# Adversary
# ---------------------------------------------------------------------------
adv_append_past: True
adv_append_wm: False
action_scale: 0.3
# Implemented choices: A2C, SAC, PPO, TD3 (no other algorithms are available yet).
adv_algo: SAC
ill_rew_zero_w_tol: True
# TODO: work out the best tolerance for MuJoCo.
tolerance: 0.05
# Use the string "only" to ignore the victim reward.
illusionary_reward_weight: 0
append_l2: False
use_reduced_distance: False

mnp_attack: False
no_attack: False

# ---------------------------------------------------------------------------
# Victim
# ---------------------------------------------------------------------------
victim_noise_sigma: 0
victim_algo: sac
victim_loadfrom: -1

# ---------------------------------------------------------------------------
# Step counts and frequencies
# ---------------------------------------------------------------------------
n_steps_vic_per_meta: 400
# Use 'all' to train only the adversary.
n_adv_steps_per_vic_step: all
# TODO: decide how long MuJoCo runs need to be.
n_train_steps_combined: 4000000

evaluate_exploitability: False

save_freq: 50000
eval_freq: 100
n_eval_episodes: 30

n_meta_episodes: -1
n_steps_total_vic: -1
n_steps_total_adv: -1

# ---------------------------------------------------------------------------
# General switches
# ---------------------------------------------------------------------------
train: True
evaluate: True
render: False

# ---------------------------------------------------------------------------
# Logging (Weights & Biases) and output locations
# ---------------------------------------------------------------------------
wandb_project_name: cotrain
wandb_entity: anonymous

# NOTE(review): "tbd" looks like a placeholder filled in at runtime — confirm.
wandb_run_id: tbd
working_directory: tbd
use_wandb: True

# output_dir and task_name form the root of the Hydra run/sweep directories.
output_dir: "/work/anonymous"
task_name: "animals_v2"


# Hydra runtime settings and submitit SLURM launcher configuration.
hydra:
    verbose: True
    job:
        # Change the working directory to the job's output directory.
        chdir: True
    launcher:
        submitit_folder: logs/multiruns/.submitit/%j
        # NOTE(review): timeout_min is 1 minute, while additional_parameters
        # below requests a 47:59:00 wall time — confirm which one SLURM
        # actually receives.
        timeout_min: 1
        cpus_per_task: 4
        gpus_per_node: 0
        # partition: gpu
        # constraint: p40
        tasks_per_node: 1
        mem_gb: 15
        nodes: 1
        # The SLURM job name follows the experiment id.
        name: ${experiment_id_new}
        _target_: hydra_plugins.hydra_submitit_launcher.submitit_launcher.SlurmLauncher
        comment: null
        exclude: gnodec1 # ,gnoded3,gnodeb1
        max_num_timeout: 0
        additional_parameters: {time: "47:59:00"}
        array_parallelism: 100
        setup: null
    # Single runs and multirun sweeps share the same
    # ${output_dir}/illusory/${task_name}/<timestamp>_<experiment id>/${env}
    # root; the override string selects the leaf directory in both cases.
    run:
        dir: ${output_dir}/illusory/${task_name}/${now:%Y-%m-%d}_${now:%H-%M-%S}_${experiment_id_new}/${env}/${hydra.job.override_dirname}
    sweep:
        # Spelled "illusory" to match hydra.run.dir (was "illussory").
        dir: ${output_dir}/illusory/${task_name}/${now:%Y-%m-%d}_${now:%H-%M-%S}_${experiment_id_new}/${env}
        subdir: ${hydra.job.override_dirname}
