#!/usr/bin/env bash

# Launcher for AntFall using split env/intrinsic rewards with TD3 dual critics.

# Strict mode: stop on the first failing command, on any reference to an
# unset variable, and when any stage of a pipeline fails.
set -o errexit -o nounset -o pipefail

# Run settings. Each may be supplied through the environment; an unset or
# empty value is replaced by the default given here.
: "${SEED:=19}"        # passed as --seed and embedded in the --algo tag
: "${GPU:=0}"          # exported to the trainer as CUDA_VISIBLE_DEVICES
: "${MAN_REW:=0.24}"   # passed as --man_rew_scale
: "${MAN_NOISE:=0.6}"  # passed as --man_noise_sigma
: "${USE_ADJ:=1}"      # 0 adds --disable_adj_net to the command line
: "${INTR_BETA:=1.0}"  # passed as --man_intrinsic_beta

#######################################
# Classify a USE_ADJ-style toggle using pattern matching only.
# The value is deliberately never handed to an arithmetic operator such as
# -eq: arithmetic evaluation treats a word like "off" as a variable name
# (an error when unset variables are fatal) and would execute any command
# substitution hidden in an array subscript.
# Arguments: $1 - candidate toggle value
# Returns:   0 if $1 is an integer zero (disable requested),
#            1 if $1 is any other decimal integer (leave enabled),
#            2 if $1 is not a plain decimal integer
#######################################
_adj_net_disabled() {
  local value=$1
  if [[ "$value" =~ ^[+-]?0+$ ]]; then
    return 0
  fi
  if [[ "$value" =~ ^[+-]?[0-9]+$ ]]; then
    return 1
  fi
  return 2
}

# Resolve the toggle once so the banner and the command line cannot disagree.
# USE_ADJ normally arrives already defaulted; the fallback to 1 only matters
# if it is empty or unset at this point. The `|| adj_rc=$?` form captures the
# helper's status without tripping errexit.
adj_rc=0
_adj_net_disabled "${USE_ADJ:-1}" || adj_rc=$?
case "$adj_rc" in
  0) adj_label=off ;;
  1) adj_label=on ;;
  *)
    printf 'error: USE_ADJ must be an integer (0 adds --disable_adj_net), got: %s\n' \
      "${USE_ADJ:-}" >&2
    exit 2
    ;;
esac

# One-line summary of the run configuration.
echo "[GPU ${GPU}] Running AntFall split-rewards (seed=${SEED}) man_rew_scale=${MAN_REW} beta=${INTR_BETA} (adj_net=${adj_label})"

# Command-line arguments for main.py. Kept as an array so every value stays a
# single word regardless of its content.
ARGS=(
  --env_name AntFall
  --algo "HAWK_AntFall_split_s${SEED}"
  --seed "$SEED"
  --man_rew_scale "$MAN_REW"
  --manager_td3_arch TD3-dual-critics
  --man_intrinsic_beta "$INTR_BETA"
  --manager_propose_freq 10
  --train_manager_freq 10
  --man_ctrl_rew_balance_start 0.1
  --man_ctrl_rew_balance_end 0.32
  --man_ctrl_rew_balance_steps 320000
  --man_noise_sigma "$MAN_NOISE"
  --reach_warmup_samples 3000
  --reach_warmup_rounds 1
)

# The disable flag is appended only when USE_ADJ resolved to zero.
if [[ "$adj_label" == off ]]; then
  ARGS+=(--disable_adj_net)
fi

# Start the trainer. The prefix assignment sets CUDA_VISIBLE_DEVICES for this
# one command only, and ARGS is expanded one word per array element.
CUDA_VISIBLE_DEVICES="$GPU" python main.py "${ARGS[@]}"

# Reached only after python returns; with errexit active a non-zero exit
# status from python ends the script before this line.
printf '%s\n' "Run finished."
