#!/bin/bash

# Load necessary modules

# Change directory to the script location
cd "$HOME/mec_shapley//"

# Generate a timestamp
TIMESTAMP=$(date +"%Y%m%d_%H%M%S")

# Define output log file with timestamp
LOG_FILE="$HOME/mec_shapley/R/experiments/jobs/non-linear1/causal_discovery/non-linear1_ncd_$TIMESTAMP.log"

# Path to the combined settings file
MODEL_PATH_FILE="$HOME/mec_shapley/R/experiments/jobs/non-linear1/causal_discovery/data_paths_non-linear1_base_cd.txt"

# Export the necessary environment variables
export MODEL_PATH_FILE

# Function to process a single line from the MODEL_PATH_FILE with different parameters
process_line() {
    local line="$1"
    local param="$2"
    Rscript "$HOME/mec_shapley/R/experiments/causal_discovery_pc.R" "$line" "$param" 0.05
}

# Export the function so it can be used by parallel
export -f process_line

# Use GNU Parallel to process each line with different parameters in parallel with a limit on the number of concurrent jobs
NUM_CONCURRENT_JOBS=20

# Generate the commands for parallel execution
cat "$MODEL_PATH_FILE" | while read -r line; do
    echo "process_line '$line' 250"
    echo "process_line '$line' 500"
    echo "process_line '$line' 2000"
    echo "process_line '$line' 4000"
done | parallel --jobs $NUM_CONCURRENT_JOBS > "$LOG_FILE" 2>&1