

# Function to generate a Slurm job script with variable parameters
generate_slurm_job <- function(job_name, shapley_file, model_path_file = NULL, cpdag_path_file = NULL, method = NULL, 
                                ncomb=NULL, nmc=1024, nobs=1024, nbatches=64, time="1:00:00", array="1-40",
                                partition="rome", move_logs = FALSE) {
  if (!is.null(model_path_file) && !is.null(cpdag_path_file)) {
    stop("Only one of model_path_file and cpdag_path_file can be specified.")
  }

  if (grepl("mec", shapley_file) && is.null(cpdag_path_file)) {
    stop("MEC requires a cpdag_path_file.")
  }

  if (grepl("mec", shapley_file) && is.null(method)) {
    stop("MEC requires a method.")
  }

  if (!is.null(model_path_file) && grepl("R/experiments", model_path_file)) {
    stop("model_path_file should be relative to the jobs folder.")   
  }
  if (!is.null(cpdag_path_file) && grepl("R/experiments", cpdag_path_file)) {
    stop("cpdag_path_file should be relative to the jobs folder.")   
  }

  
  lines <- list()

  lines <- append(lines, "#!/bin/bash\n")
  
  # SLURM directives
  lines <- append(lines, paste0("#SBATCH --partition=", partition))
  lines <- append(lines, paste0("#SBATCH --job-name=", job_name))
  lines <- append(lines, paste0("#SBATCH --ntasks=", 1))
  lines <- append(lines, paste0("#SBATCH --cpus-per-task=", 16))
  lines <- append(lines, paste0("#SBATCH --time=", time))
  if (grepl("%", array)) {
    lines <- append(lines, paste0("#SBATCH --array=", array))
  } else {
    lines <- append(lines, paste0("#SBATCH --array=", array, "%8"))
  }


  lines <- append(lines, paste0("#SBATCH --output=", job_name, "_%A_%a.out\n"))
  
  # Modules and initial path setup
  lines <- append(lines, "module purge")
  lines <- append(lines, "module load 2023")
  lines <- append(lines, "module load R/4.3.2-gfbf-2023a\n")

  lines <- append(lines, "# Your job starts in the directory where you call sbatch")
  lines <- append(lines, "cd $HOME/mec_shapley/\n")

  
  # Model path setup
  lines <- append(lines, "# Path to your combined settings file")
  
  if (!is.null(model_path_file)) {
    lines <- append(lines, paste0("MODEL_PATH_FILE=\"$HOME/mec_shapley/R/experiments/jobs/", model_path_file, "\"\n"))
  } else if (!is.null(cpdag_path_file)) {
    lines <- append(lines, paste0("MODEL_PATH_FILE=\"$HOME/mec_shapley/R/experiments/jobs/", cpdag_path_file, "\"\n"))
  }
  
  # Job execution logic
  lines <- append(lines, "for i in {1..1}; do  # Adjust the number of parallel runs")
  #job_script <- paste(job_script, "for i in {1..1}; do  # Adjust the number of parallel runs\n")
  
  rscript_line <- paste0("  Rscript $HOME/mec_shapley/R/experiments/", shapley_file)
  if (!is.null(model_path_file)) {
    rscript_line <- paste0(rscript_line, " --modelpath $(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
  } else if (!is.null(cpdag_path_file)) {
    rscript_line <- paste0(rscript_line, " --cpdagpath $(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
  }
  rscript_line <- paste0(rscript_line, " --ntoexplain 40 ")
  rscript_line <- paste0(rscript_line, " --nmc ", nmc, " --nobs ", nobs)
  if (!is.null(ncomb)) {
    rscript_line <- paste0(rscript_line, " --ncomb ", ncomb)
  }
  rscript_line <- paste0(rscript_line, " --nbatches ", nbatches)

  if (!is.null(method)) {
    rscript_line <- paste0(rscript_line, " --method ", method)
  }

  rscript_line <- paste0(rscript_line, " &")
  
  lines <- append(lines, rscript_line)
  lines <- append(lines, "done\n")
  lines <- append(lines, "wait")
  
  if (move_logs) {
    # Move log file to model path directory
    lines <- append(lines, "# Move log file to model path directory")
    lines <- append(lines, "MODEL_PATH=$(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
    lines <- append(lines, paste0("LOG_FILE=\"$HOME/mec_shapley/", job_name, "_${SLURM_JOB_ID}_${SLURM_ARRAY_TASK_ID}.out\""))
    lines <- append(lines, "mv $LOG_FILE $MODEL_PATH/")
  }
  

  return(lines)
}


# Function to generate a Slurm job script with variable parameters
generate_slurm_job_variable <- function(job_name, shapley_file, model_path_file = NULL, cpdag_path_file = NULL,
                                        method = NULL,
                               ncomb=NULL, nmc=1024, nobs=1024, nbatches=64, time="1:00:00", array="1-40",
                               partition="rome", move_logs = FALSE) {
  if (!is.null(model_path_file) && !is.null(cpdag_path_file)) {
    stop("Only one of model_path_file and cpdag_path_file can be specified.")
  }

  if (grepl("mec", shapley_file) && is.null(cpdag_path_file)) {
    stop("MEC requires a cpdag_path_file.")
  }

  if (grepl("mec", shapley_file) && is.null(method)) {
    stop("MEC requires a method.")
  }

  if (!is.null(model_path_file) && grepl("R/experiments", model_path_file)) {
    stop("model_path_file should be relative to the jobs folder.")   
  }
  if (!is.null(cpdag_path_file) && grepl("R/experiments", cpdag_path_file)) {
    stop("cpdag_path_file should be relative to the jobs folder.")   
  }

  lines <- list()

  lines <- append(lines, "#!/bin/bash\n")
  
  # SLURM directives
  lines <- append(lines, paste0("#SBATCH --partition=", partition))
  lines <- append(lines, paste0("#SBATCH --job-name=", job_name))
  lines <- append(lines, paste0("#SBATCH --ntasks=", 1))
  lines <- append(lines, paste0("#SBATCH --cpus-per-task=", 16))
  lines <- append(lines, paste0("#SBATCH --time=", time))
  if (grepl("%", array)) {
    lines <- append(lines, paste0("#SBATCH --array=", array))
  } else {
    lines <- append(lines, paste0("#SBATCH --array=", array, "%8"))
  }

  lines <- append(lines, paste0("#SBATCH --output=", job_name, "_%A_%a.out\n"))
  
  # Modules and initial path setup
  lines <- append(lines, "module purge")
  lines <- append(lines, "module load 2023")
  lines <- append(lines, "module load R/4.3.2-gfbf-2023a\n")

  lines <- append(lines, "# Your job starts in the directory where you call sbatch")
  lines <- append(lines, "cd $HOME/mec_shapley/\n")
  
  # Model path setup
  lines <- append(lines, "# Path to your combined settings file")
  
  if (!is.null(model_path_file)) {
    lines <- append(lines, paste0("MODEL_PATH_FILE=\"$HOME/mec_shapley/R/experiments/jobs/", model_path_file, "\"\n"))
  } else if (!is.null(cpdag_path_file)) {
    lines <- append(lines, paste0("MODEL_PATH_FILE=\"$HOME/mec_shapley/R/experiments/jobs/", cpdag_path_file, "\"\n"))
  }
  
  # Job execution logic for multiple values
  param_name <- NULL
  param_values <- NULL
  
  if (length(nmc) > 1) {
    param_name <- "nmc"
    param_values <- nmc
  } else if (length(nobs) > 1) {
    param_name <- "nobs"
    param_values <- nobs
  } else if (length(ncomb) > 1) {
    param_name <- "ncomb"
    param_values <- ncomb
  } else {
    param_values <- list(nmc)
    param_name <- "nmc"
  }
  
  for (param_val in param_values) {
    rscript_line <- paste0("Rscript $HOME/mec_shapley/R/experiments/", shapley_file)
    if (!is.null(model_path_file)) {
      rscript_line <- paste0(rscript_line, " --modelpath $(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
    } else if (!is.null(cpdag_path_file)) {
      rscript_line <- paste0(rscript_line, " --cpdagpath $(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
    }
    rscript_line <- paste0(rscript_line, " --ntoexplain 40 ")
    
    if (param_name == "nmc") {
      rscript_line <- paste0(rscript_line, " --nmc ", param_val, " --nobs ", nobs)
    } else if (param_name == "nobs") {
      rscript_line <- paste0(rscript_line, " --nmc ", nmc, " --nobs ", param_val)
    } else if (param_name == "ncomb") {
      rscript_line <- paste0(rscript_line, " --nmc ", nmc, " --nobs ", nobs, " --ncomb ", param_val)
    }
    
    rscript_line <- paste0(rscript_line, " --nbatches ", nbatches)
  
    if (!is.null(method)) {
      rscript_line <- paste0(rscript_line, " --method ", method)
    }
  
    lines <- append(lines, rscript_line)
  }

  if (move_logs) {
    # Move log file to model path directory
    lines <- append(lines, "# Move log file to model path directory")
    lines <- append(lines, "MODEL_PATH=$(head -$(($SLURM_ARRAY_TASK_ID)) $MODEL_PATH_FILE | tail -1)")
    lines <- append(lines, paste0("LOG_FILE=\"$HOME/mec_shapley/", job_name, "_${SLURM_JOB_ID}_${SLURM_ARRAY_TASK_ID}.out\""))
    lines <- append(lines, "mv $LOG_FILE $MODEL_PATH/")
  }
  
  return(lines)
}