#!/usr/bin/env bash

: "${ENV_NAME:=kitchen-complete-v0}"
: "${SEED:=1}"
: "${REPLAY:=mixed}"
: "${RR:=1}"                  # replay ratio (UTD)

echo "Environment Name: $ENV_NAME"
echo "Seed:             $SEED"
echo "Replay:           $REPLAY"
echo "UTD (RR):         $RR"

# Determine which launch script to use based on environment name
LAUNCH_SCRIPT=""
RESUME_PATH_PREFIX=""
RESUME_CHECKPOINT=""
PROJECT="test"
if [[ $ENV_NAME == *"kitchen"* ]]; then
    LAUNCH_SCRIPT="./experiments/scripts/kitchen/launch_sac_finetune.sh"
    # need to modify the path based on your own path
    RESUME_PATH_PREFIX="~/o2o_log/${ENV_NAME}_calql_seed"
    RESUME_CHECKPOINT="250000"
elif [[ $ENV_NAME == *"maze"* ]]; then
    LAUNCH_SCRIPT="./experiments/scripts/antmaze/launch_sac_finetune.sh"
    # need to modify the path based on your own path
    RESUME_PATH_PREFIX="~/o2o_log/${ENV_NAME}_calql_seed"
    RESUME_CHECKPOINT="1000000"
elif [[ $ENV_NAME == *"door"* ]] || [[ $ENV_NAME == *"pen"* ]] || [[ $ENV_NAME == *"relocate"* ]]; then
    LAUNCH_SCRIPT="./experiments/scripts/adroit/launch_sac_finetune.sh"
    # need to modify the path based on your own path
    RESUME_PATH_PREFIX="~/o2o_log/${ENV_NAME}_calql_seed"
    RESUME_CHECKPOINT="20000"
elif [[ $ENV_NAME == *"cheetah"* ]] || [[ $ENV_NAME == *"walker"* ]] || [[ $ENV_NAME == *"hopper"* ]]; then
    LAUNCH_SCRIPT="./experiments/scripts/locomotion/launch_sac_finetune.sh"
    # need to modify the path based on your own path
    RESUME_PATH_PREFIX="~/o2o_log/${ENV_NAME}_calql_seed"
    RESUME_CHECKPOINT="250000"
else
    echo "Unknown environment type: $ENV_NAME"
    exit 1
fi

GROUP="sac_${ENV_NAME}"

# Configure replay settings
case "$REPLAY" in
    warmup)
        warmup_steps=5000
        online_sampling_method="mixed"
        offline_data_ratio=0.0
        exp_name="warmup_${warmup_steps}"
        ;;
    append)
        warmup_steps=0
        online_sampling_method="append"
        offline_data_ratio=0.0
        exp_name="append"
        ;;
    no)
        warmup_steps=0
        online_sampling_method="mixed"
        offline_data_ratio=0.0
        exp_name="no"
        ;;
    mixed)
        warmup_steps=0
        online_sampling_method="mixed"
        offline_data_ratio=0.5
        exp_name="mixed_${offline_data_ratio}"
        ;;
    *)
        echo "Unknown replay type: $REPLAY"
        exit 1
        ;;
esac

chmod +x "$LAUNCH_SCRIPT"

ARGS=(
    --env "$ENV_NAME"
    --group "$GROUP"
    --project "$PROJECT"
    --seed "$SEED"
    --warmup_steps "$warmup_steps"
    --online_sampling_method "$online_sampling_method"
    --offline_data_ratio "$offline_data_ratio"
    --utd "$RR"
    --exp_name "$exp_name"
)

RESUME_PATH="${RESUME_PATH_PREFIX}${SEED}/checkpoint_${RESUME_CHECKPOINT}"
echo "Resume path: $RESUME_PATH"
ARGS+=(--resume_path "$RESUME_PATH")

echo "Launching: $LAUNCH_SCRIPT ${ARGS[*]}"
"$LAUNCH_SCRIPT" "${ARGS[@]}"


