#!/usr/bin/env bash

# Launcher for AntFall with tuned intrinsic weighting for dense rewards.

set -euo pipefail

# Environment overrides (all optional; defaults shown):
#   SEED=19        forwarded as --seed and embedded in the --algo run name
#   GPU=0          exported to the python process as CUDA_VISIBLE_DEVICES
#   MAN_REW=0.24   forwarded as --man_rew_scale
#   MAN_NOISE=0.6  forwarded as --man_noise_sigma
#   USE_ADJ=1      integer flag; 0 appends --disable_adj_net, any other
#                  integer leaves the flag off the command line
SEED=${SEED:-19}
GPU=${GPU:-0}
MAN_REW=${MAN_REW:-0.24}
MAN_NOISE=${MAN_NOISE:-0.6}
USE_ADJ=${USE_ADJ:-1}

# Classify USE_ADJ once, by pattern rather than with `[[ ... -eq 0 ]]`.
# `-eq` evaluates its operands as arithmetic expressions, so a value such as
# "off" is looked up as a variable name (and aborts with an "unbound variable"
# error under `set -u`), and an arbitrary string from the environment would be
# evaluated as an expression. Matching digits only avoids both problems.
if [[ "$USE_ADJ" =~ ^[+-]?0+$ ]]; then
  adj_state=off
elif [[ "$USE_ADJ" =~ ^[+-]?[0-9]+$ ]]; then
  adj_state=on
else
  printf 'error: USE_ADJ must be an integer (0 disables adj_net), got: %s\n' \
    "$USE_ADJ" >&2
  exit 2
fi

echo "[GPU ${GPU}] Running AntFall (seed=${SEED}) with man_rew_scale=${MAN_REW} (adj_net=${adj_state})"

# Arguments are collected in an array so each value reaches main.py as exactly
# one word regardless of its content.
ARGS=(
  --env_name AntFall
  --algo "HAWK_AntFall_s${SEED}_strong"
  --seed "$SEED"
  --man_rew_scale "$MAN_REW"
  --manager_propose_freq 10
  --train_manager_freq 10
  --man_ctrl_rew_balance_start 0.1
  --man_ctrl_rew_balance_end 0.32
  --man_ctrl_rew_balance_steps 320000
  --man_noise_sigma "$MAN_NOISE"
  --reach_warmup_samples 3000
  --reach_warmup_rounds 1
)

if [[ "$adj_state" == off ]]; then
  ARGS+=(--disable_adj_net)
fi

# The assignment prefix scopes CUDA_VISIBLE_DEVICES to this one command.
# Under `set -e`, a non-zero exit from python stops the script before the
# final message is printed.
CUDA_VISIBLE_DEVICES="$GPU" \
python main.py "${ARGS[@]}"

echo "Run finished."
