#!/usr/bin/env bash

# Launcher for AntMaze with tuned intrinsic weighting.

# Strict mode: abort on any failing command, unset variable, or failed
# pipeline stage.
set -euo pipefail

# Environment-overridable settings; the default applies when the variable
# is unset or empty.
#   SEED    - value forwarded to --seed and embedded in the --algo run tag
#   GPU     - value exported as CUDA_VISIBLE_DEVICES for the python process
#   MAN_REW - intrinsic weight forwarded to --man_rew_scale
#             (original note: scaled internally per env)
: "${SEED:=7}"
: "${GPU:=0}"
: "${MAN_REW:=0.4}"

printf '%s\n' "[GPU ${GPU}] Running AntMaze (seed=${SEED}) with man_rew_scale=${MAN_REW}"

# Collect the command-line flags in an array so every value stays a single
# word without relying on backslash line continuations.
train_args=(
  --env_name AntMaze
  --algo "HAWK_AntMaze_s${SEED}_new"
  --seed "${SEED}"
  --man_rew_scale "${MAN_REW}"
  # Manager schedule and reward-balance settings are fixed for this launcher.
  --manager_propose_freq 10
  --train_manager_freq 10
  --man_ctrl_rew_balance_start 0.0
  --man_ctrl_rew_balance_end 0.2
  --man_ctrl_rew_balance_steps 300000
)

# The assignment prefix sets CUDA_VISIBLE_DEVICES for this one command only.
CUDA_VISIBLE_DEVICES="${GPU}" python main.py "${train_args[@]}"

# Reached only when python exits with status 0 (set -e aborts otherwise).
printf '%s\n' "Run finished."
