#!/bin/bash

N=8
seeds=(0 1 2 3 4 5 6 7)
tasks=()


for seed in "${seeds[@]}"; do
    device=$(( seed % 4 ))

    # oracle
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Quadcopter-Direct-v0 --headless \
        agent.outer_loop.exploration=none agent.outer_loop.use_gradient=false agent.run_name=drone-oracle agent.outer_loop.start_with_oracle=True"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")

    # gradient
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Quadcopter-Direct-v0 --headless \
        agent.outer_loop.exploration=none agent.outer_loop.use_gradient=true agent.run_name=drone-gradient"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")

    # morse
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Quadcopter-Direct-v0 --headless \
        agent.outer_loop.exploration=single agent.outer_loop.use_gradient=true agent.run_name=drone-morse"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")

    # oracle
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Velocity-Flat-Unitree-A1-v0 --headless \
        agent.outer_loop.exploration=none agent.outer_loop.use_gradient=false agent.run_name=a1-oracle agent.outer_loop.start_with_oracle=True"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")

    # gradient
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Velocity-Flat-Unitree-A1-v0 --headless \
        agent.outer_loop.exploration=none agent.outer_loop.use_gradient=true agent.run_name=a1-gradient"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")

    # morse
    BASE_CMD="xvfb-run --auto-servernum -s '-screen 0 1280x1024x24' ./isaaclab.sh -p scripts/reinforcement_learning/rsl_rl/train.py --task=Isaac-Velocity-Flat-Unitree-A1-v0 --headless \
        agent.outer_loop.exploration=single agent.outer_loop.use_gradient=true agent.run_name=a1-morse"
    cmd="export CUDA_VISIBLE_DEVICES=$device; $BASE_CMD agent.seed=$seed"
    tasks+=("$cmd")
done


total_tasks=${#tasks[@]}
tasks_per_window=$(( (total_tasks + N - 1) / N ))
SESSION_NAME="isaaclab"

tmux kill-session -t $SESSION_NAME

tmux new-session -d -s $SESSION_NAME

for ((i = 0; i < N; i++)); do
  start=$((i * tasks_per_window))
  end=$((start + tasks_per_window - 1))
  [ $end -ge $total_tasks ] && end=$((total_tasks - 1))

  [ $start -gt $end ] && continue

  script=""
  for ((j = start; j <= end; j++)); do
    script+="${tasks[$j]}; "
  done

  if [ $i -eq 0 ]; then
    tmux send-keys -t $SESSION_NAME "$script" C-m
  else
    tmux new-window -t $SESSION_NAME
    tmux send-keys -t $SESSION_NAME:$i "$script" C-m
  fi
done

echo "send all commands to '$SESSION_NAME'"
tmux list-windows -t $SESSION_NAME
