#!/bin/bash

# List of encoder names
encoders=("bow" "roberta" "MiniLM" "Mistral-7B" )

# List of datasets
datasets=("cora" "citeseer" "pubmed" "computer" "photo" "history" "wikics" "instagram" "reddit" "arxiv")

# Max concurrent jobs (adjust according to your system resources)
MAX_JOBS=2
current_jobs=0

for encoder in "${encoders[@]}"; do
  for dataset in "${datasets[@]}"; do

    # Construct the command
    if [[ "$encoder" == "Mistral-7B" ]]; then
      cmd="python embedding.py --encoder_name=$encoder --dataset=$dataset --use_cls=1"
    else
      cmd="python embedding.py --encoder_name=$encoder --dataset=$dataset"
    fi

    # Run in background
    echo "Running: $cmd"
    eval "$cmd" &

    ((current_jobs++))

    # If max jobs reached, wait for all to finish
    if [[ $current_jobs -ge $MAX_JOBS ]]; then
      wait
      current_jobs=0
    fi

  done
done

# Final wait in case some jobs are still running
wait
