#!/bin/bash

# Relaunch the random-shuffle baseline for every model, one background job per
# GPU group. Baseline setup: constant learning rate, randomly shuffled data
# (no curriculum).
#
# Relative paths (./models, logs/, ./data/sft) resolve against the current
# working directory, so run this from the directory that contains ./data.

readonly PYTHON_BIN=/home/nebius/argus/.venv/bin/python
readonly TRAIN_SCRIPT=/home/nebius/argus/random_shuffle_baseline.py
readonly LEARNING_RATE=5e-5
readonly DATA_DIR=./data/sft
readonly LOG_DIR=logs
# pkill/pgrep -f take a regex matched against the full command line; the dot is
# escaped so it only matches a literal '.'.
readonly PROC_PATTERN='random_shuffle_baseline\.py'
# Upper bound (seconds) on how long to wait for earlier runs to exit.
readonly STOP_TIMEOUT_SECS=30

#######################################
# Signal any earlier baseline runs and wait (bounded) for them to exit, so the
# new jobs do not start on GPUs the old ones are still holding.
# Globals:   PROC_PATTERN, STOP_TIMEOUT_SECS (read)
# Arguments: none
# Outputs:   a warning on stderr if processes are still alive after the timeout
#######################################
stop_previous_runs() {
  local waited=0

  # pkill exits non-zero when nothing matched; that is the normal first-run
  # case, so its status is deliberately not treated as an error.
  pkill -f "$PROC_PATTERN"

  # pkill only delivers the signal; poll until the processes are really gone.
  while pgrep -f "$PROC_PATTERN" > /dev/null 2>&1; do
    if ((waited >= STOP_TIMEOUT_SECS)); then
      printf 'warning: processes matching %s still running after %ss; launching anyway\n' \
        "$PROC_PATTERN" "$STOP_TIMEOUT_SECS" >&2
      break
    fi
    sleep 1
    waited=$((waited + 1))
  done
}

#######################################
# Start one training job in the background under nohup.
# Globals:   PYTHON_BIN, TRAIN_SCRIPT, LEARNING_RATE, DATA_DIR, LOG_DIR (read)
# Arguments: $1 - comma-separated GPU ids exported as CUDA_VISIBLE_DEVICES
#            $2 - model name; also used as the log file stem
# Outputs:   job stdout+stderr go to ${LOG_DIR}/<model>.log; one status line
#            with the job's PID on stdout
#######################################
launch() {
  local devices=$1
  local model=$2
  # --gpu receives the first id of the device list, as in the original commands.
  # NOTE(review): with CUDA_VISIBLE_DEVICES set, visible devices are renumbered
  # from 0; if the training script uses --gpu as a CUDA device index, any value
  # other than 0 may be wrong - confirm against random_shuffle_baseline.py.
  local gpu_arg=${devices%%,*}
  local log_file="${LOG_DIR}/${model}.log"

  CUDA_VISIBLE_DEVICES="$devices" nohup "$PYTHON_BIN" "$TRAIN_SCRIPT" \
    --model "$model" --gpu "$gpu_arg" --lr "$LEARNING_RATE" \
    --data_dir "$DATA_DIR" > "$log_file" 2>&1 &

  printf 'started %s on GPU(s) %s (pid %s), log: %s\n' \
    "$model" "$devices" "$!" "$log_file"
}

stop_previous_runs

# Create directories. ./models is not referenced again in this script;
# presumably the training script writes checkpoints there (confirm).
# Abort if creation fails: without the log directory every redirect below
# would fail and no job would start.
mkdir -p ./models "$LOG_DIR" || {
  printf 'error: cannot create ./models and %s\n' "$LOG_DIR" >&2
  exit 1
}

# One job per GPU group; the two largest models get two GPUs each.
launch 0 LFM2-350M
launch 1 LFM2-700M
launch 2,3 LFM2-1.2B
launch 4 SmolLM2-135M-Instruct
launch 5 SmolLM2-360M-Instruct
launch 6,7 SmolLM2-1.7B-Instruct