determine_n_combinations <- function(n_nodes, n_samples_expectation) {
  return(NULL)
}

get_opt_parser <- function() {
  option_list <- list(
    optparse::make_option("--modelpath", type="character", default=NULL,
                  help="Path to model file [default %default]"),
    optparse::make_option("--cpdagpath", type="character", default=NULL,
                  help="Path to cpdag file [default %default]"),
    optparse::make_option("--dagpath", type="character", default=NULL,
                  help="Path to dag file [default %default]"),

    optparse::make_option("--method", type="character", default="sample",
                help="Method to use for approximating interventional expectations [sample|iw] [default %default]"),
    optparse::make_option("--ntoexplain", type="integer", default=NULL,
                help="Number of samples to explain [default %default]"),
    optparse::make_option("--nobs", type="integer", default=NULL,
                help="Number of observational samples used for distribution estimation/iw [default %default]"),
    optparse::make_option("--nmc", type="integer", default=NULL,
                  help="Number of Monte Carlo samples used to approximate expectations [default %default]"),
    optparse::make_option("--ncomb", type="integer", default=NULL,
                  help="Number of combinations for Shapley value estimation [default %default]"),


    optparse::make_option("--cpdagidx", type="integer", default=NULL,
                    help="Index of DAG in CPDAG file [default %default]"),
    optparse::make_option("--nbatches", type="integer", default=NULL,
                  help="Number of batches for Shapley value estimation [default %default]")
  )
  return(optparse::OptionParser(option_list=option_list))
}


save_dag <- function(dag, n_nodes, min_parents_y, n_expected_neighbors, n_expected_parents_y, seed) {
  base_folder <- 'experiments/1_dags'
  n_nodes_folder <- paste0(base_folder, '/', n_nodes, '_nodes')
  # min_parents_y is fixed for the number of nodes
  type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')

  if (!dir.exists(type_folder)) {
    dir.create(type_folder, recursive = TRUE)
  }

  file_path <- paste0(type_folder, '/', seed, '.rds')
  dag_and_parameters <- list(dag = dag, n_nodes = n_nodes, min_parents_y = min_parents_y, n_expected_neighbors = n_expected_neighbors, n_expected_parents_y = n_expected_parents_y, seed = seed)
  saveRDS(dag_and_parameters, file_path)

  # Save settings to log file
  settings_line <- sprintf(
    "%65s, seed: %3d, n_nodes: %3d, min_parents_y: %3d, n_expected_neighbors: %3d, n_expected_parents_y: %3d",
    file_path, seed, n_nodes, min_parents_y, n_expected_neighbors, n_expected_parents_y
  )
  log_append_to_file(settings_line, paste0(type_folder, '/log.txt'))
}

save_scm <- function(scm, scm_type, dag_path, n_nodes, n_expected_neighbors, n_expected_parents_y, seed) {
  base_folder <- 'experiments/2_scms'

  # Check if n_nodes, n_expected_neighbors and n_expected_parents_y match dag_dir
  stopifnot(grepl(paste0(n_nodes, '_nodes'), dag_path))
  stopifnot(grepl(paste0(n_expected_neighbors, '_neighbors'), dag_path))
  stopifnot(grepl(paste0(n_expected_parents_y, '_parents_y'), dag_path))

  scm_type_folder <- paste0(base_folder, '/', scm_type)
  n_nodes_folder <- paste0(scm_type_folder, '/', n_nodes, '_nodes')
  dag_type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')


  if (!dir.exists(dag_type_folder)) {
    dir.create(dag_type_folder, recursive = TRUE)
  }

  file_path <- paste0(dag_type_folder, '/', seed, '.rds')
  scm_and_parameters <- list(scm = scm,
                             scm_type = scm_type,
                             n_nodes = n_nodes,
                             n_expected_neighbors = n_expected_neighbors,
                             n_expected_parents_y = n_expected_parents_y,
                             seed = seed,
                             dag_path = dag_path)
  saveRDS(scm_and_parameters, file_path)

  # Save settings to log file
  settings_line <- sprintf(
    "%65s, seed: %2d, type: %12s, dag file: %65s, n_nodes: %3d, n_expected_neighbors: %3d, n_expected_parents_y: %3d",
    file_path, seed, scm_type, dag_path, n_nodes, n_expected_neighbors, n_expected_parents_y
  )

  log_append_to_file(settings_line, paste0(dag_type_folder, '/log.txt'))
}


save_data <- function(data_observational, data_to_explain, scm_type, scm_path, n_nodes, n_expected_neighbors, n_expected_parents_y, seed) {
  base_folder <- 'experiments/3_data'

  # Check if n_nodes, n_expected_neighbors and n_expected_parents_y match dag_dir
  stopifnot(grepl(paste0(n_nodes, '_nodes'), scm_path))
  stopifnot(grepl(paste0(n_expected_neighbors, '_neighbors'), scm_path))
  stopifnot(grepl(paste0(n_expected_parents_y, '_parents_y'), scm_path))

  scm_type_folder <- paste0(base_folder, '/', scm_type)
  n_nodes_folder <- paste0(scm_type_folder, '/', n_nodes, '_nodes')
  dag_type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')

  if (!dir.exists(dag_type_folder)) {
    dir.create(dag_type_folder, recursive = TRUE)
  }

  file_path <- paste0(dag_type_folder, '/', seed, '.rds')
  data_and_parameters <- list(data_observational = data_observational,
                              data_to_explain = data_to_explain,
                              scm_type = scm_type,
                              n_nodes = n_nodes,
                              n_expected_neighbors = n_expected_neighbors,
                              n_expected_parents_y = n_expected_parents_y,
                              seed = seed,
                              scm_path = scm_path)
  saveRDS(data_and_parameters, file_path)

  # Save settings to log file
    settings_line <- sprintf(
      "%65s, seed: %2d, type: %12s, scm file: %65s, n_nodes: %3d, n_expected_neighbors: %3d, n_expected_parents_y: %3d",
      file_path, seed, scm_type, scm_path, n_nodes, n_expected_neighbors, n_expected_parents_y
    )

  log_append_to_file(settings_line, paste0(dag_type_folder, '/log.txt'))
}

save_model <- function(model, model_type, scm_type, data_path, n_training_points, n_nodes, n_expected_neighbors, n_expected_parents_y, seed, ...) {
  base_folder <- 'experiments/4_models'

  # Check if n_nodes, n_expected_neighbors and n_expected_parents_y match dag_dir
  stopifnot(grepl(paste0(n_nodes, '_nodes'), data_path))
  stopifnot(grepl(paste0(n_expected_neighbors, '_neighbors'), data_path))
  stopifnot(grepl(paste0(n_expected_parents_y, '_parents_y'), data_path))

  model_type_folder <- paste0(base_folder, '/', model_type)
  scm_type_folder <- paste0(model_type_folder, '/', scm_type)
  n_nodes_folder <- paste0(scm_type_folder, '/', n_nodes, '_nodes')
  dag_type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')

  if (!dir.exists(dag_type_folder)) {
    dir.create(dag_type_folder, recursive = TRUE)
  }

  file_path <- paste0(dag_type_folder, '/', seed, '.rds')

  model_and_parameters <- list(model = model,
                               model_type = model_type,
                               scm_type = scm_type,
                               data_path = data_path,
                               n_training_points = n_training_points,
                               n_nodes = n_nodes,
                               n_expected_neighbors = n_expected_neighbors,
                               n_expected_parents_y = n_expected_parents_y,
                               seed = seed,
                               ...
                               )

  if (!(file.access(dirname(file_path), mode = 2) == 0)) {
    log_to_shell(paste0("Cannot write to directory: ", dirname(file_path)))
    log_to_shell(paste0("Working directory: ", getwd()))
    stop("Exiting.")
  }

  log_to_shell(paste0("Saving model to ", file_path))
  # Also save xgboost model to file (see https://www.rdocumentation.org/packages/xgboost/versions/1.7.7.1/topics/a-compatibility-note-for-saveRDS-save)
  # Update 27/04: saving xgboost model using saveRDS now returning error
  if (model_type == "xgboost") {
    xgboost_filepath <- paste0(dag_type_folder, '/', seed, '_xgb.model')
    xgboost::xgb.save(model, xgboost_filepath)
    model_and_parameters$xgboost_path <- xgboost_filepath
  }

  saveRDS(model_and_parameters, file_path)


  settings_line <- sprintf(
    "%65s, seed: %2d, type: %12s, data_path: %65s, n_training_points: %6d, n_nodes: %3d, n_expected_neighbors: %3d, n_expected_parents_y: %3d",
    file_path, seed, model_type, data_path, n_training_points, n_nodes, n_expected_neighbors, n_expected_parents_y
  )

  log_append_to_file(settings_line, paste0(dag_type_folder, '/log.txt'))
}

name_explanation <- function(explanation, explanation_type, seed,
                             n_observational, n_samples_expectation, n_combinations,
                             n_batches,
                             cpdag_path = NULL, cpdag_dag_idx = NULL){

  # Extract number of nodes
  n_nodes <- ncol(explanation$internal$data$x_explain) + 1

  # Extract number of samples explained
  n_samples_explained <- nrow(explanation$internal$data$x_explain)

  # suffix <- NULL
  # if (grepl("causal", explanation_type)) {
  #   # If we provided cpdag_path and cpdag_idx, we can extract the name of the cpdag
  #   # Format is always seed_name_cpdag.rds
  #   if (!is.null(cpdag_dag_idx)) {
  #     filename <- basename(cpdag_path)
  #     name <- sub("^\\d+_(.*)_cpdag\\.rds$", "\\1", filename)
  #     suffix <- paste0(name, '_dag_', cpdag_dag_idx)
  #   } else {
  #     suffix <- 'true_dag'
  #   }
  # }

  # Add cpdag path to explanation_type
  if (!is.null(cpdag_path)) {
    filename <- basename(cpdag_path)
    cpdag_name <- sub("^\\d+_(.*)_cpdag\\.rds$", "\\1", filename)
    explanation_type <- paste0(cpdag_name, '_', explanation_type)
    if (!is.null(cpdag_dag_idx)) {
      explanation_type <- paste0(explanation_type, '_dag_', cpdag_dag_idx)
    }
  }

  # Create save name
  if (is.null(n_combinations)) {
    n_combinations_for_name <- 2^(n_nodes - 1)
  } else {
    n_combinations_for_name <- n_combinations
  }

  name <- paste0(seed, '_', explanation_type, '_',
                 n_observational, 'O_',
                 n_samples_expectation, 'E_',
                 n_combinations_for_name, 'C_',
                 n_batches, 'B_',
                 n_samples_explained, 'S'
                 )

  # if (!is.null(suffix)) {
  #   name <- paste0(name, '_', suffix)
  # }

  return(name)
}

generate_unique_filename <- function(folder, base_filename) {
  counter <- 0
  new_filename <- base_filename

  # Check if the file exists and append incrementing numbers until it doesn't
  file_path <- paste0(folder, '/', new_filename, '.rds')
  while (file.exists(file_path)) {
    counter <- counter + 1
    # Append the counter to the base filename before the file extension
    new_filename <- paste0(base_filename, "_", counter)
    file_path <- paste0(folder, '/', new_filename, '.rds')
  }

  return(new_filename)
}


save_explanation <- function(explanation, explanation_type, model_and_parameters, model_path,
                             n_observational, n_samples_expectation, n_combinations_shapr,
                             n_batches, duration, cpdag_dag_idx = NULL, cpdag_path = NULL, ...) {
  base_folder <- 'experiments/6_explanations'
  scm_type <- model_and_parameters$scm_type
  n_nodes <- model_and_parameters$n_nodes
  n_expected_neighbors <- model_and_parameters$n_expected_neighbors
  n_expected_parents_y <- model_and_parameters$n_expected_parents_y
  seed <- model_and_parameters$seed

  model_type_folder <- paste0(base_folder, '/', model_and_parameters$model_type)
  scm_type_folder <- paste0(model_type_folder, '/', scm_type)
  n_nodes_folder <- paste0(scm_type_folder, '/', n_nodes, '_nodes')
  dag_type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')

  if (!dir.exists(dag_type_folder)) {
    dir.create(dag_type_folder, recursive = TRUE)
  }

  file_name <- name_explanation(explanation, explanation_type, seed,
                                    n_observational, n_samples_expectation, n_combinations_shapr,
                                    n_batches, cpdag_path = cpdag_path, cpdag_dag_idx = cpdag_dag_idx)
  generated_filename <- generate_unique_filename(dag_type_folder, file_name)
  file_path <- paste0(dag_type_folder, '/', generated_filename, '.rds')

  shapley_values <- explanation$shapley_values
  shapr_timings <- explanation$timing

  explanation_and_parameters <- list(shapley_values = shapley_values,
                                     shapr_timings = shapr_timings,
                                      explanation_type = explanation_type,
                                      model_path = model_path,
                                      n_observational = n_observational,
                                      n_samples_expectation = n_samples_expectation,
                                      n_combinations_shapr = n_combinations_shapr,
                                      n_batches = n_batches,
                                      duration = duration,
                                      scm_type = scm_type,
                                      n_nodes = n_nodes,
                                      n_expected_neighbors = n_expected_neighbors,
                                      n_expected_parents_y = n_expected_parents_y,
                                      seed = seed,
                                      cpdag_dag_idx = cpdag_dag_idx,
                                      cpdag_path = cpdag_path,
                                     ...
  )
  log_to_shell(paste0("Saving explanation to ", file_path))
  saveRDS(explanation_and_parameters, file_path)

  # Save settings to log file
  settings_line <- sprintf(
    "%65s, seed: %2d, type: %12s, model_path: %65s, n_observational: %6d, n_samples_expectation: %6d, n_combinations_shapr: %6d, n_batches: %6d",
    file_path, seed, explanation_type, model_path, n_observational, n_samples_expectation, n_combinations_shapr, n_batches
  )

  log_append_to_file(settings_line, paste0(dag_type_folder, '/log.txt'))
}

save_cpdag <- function(cpdag, dags, name, scm_type, n_nodes, n_expected_neighbors, n_expected_parents_y, seed,
                       true_dag_path = NULL, data_path = NULL, n_observational = NULL, ...) {
  base_folder <- 'experiments/5_causal_discovery'
  scm_type_folder <- paste0(base_folder, '/', scm_type)
  n_nodes_folder <- paste0(scm_type_folder, '/', n_nodes, '_nodes')
  dag_type_folder <- paste0(n_nodes_folder, '/', n_expected_neighbors, '_neighbors', '_', n_expected_parents_y, '_parents_y')

  if (!dir.exists(dag_type_folder)) {
    dir.create(dag_type_folder, recursive = TRUE)
  }

  file_path_cpdag <- paste0(dag_type_folder, '/', seed, '_', name, '_cpdag.rds')
  cpdag_and_parameters <- list(cpdag = cpdag,
                               dags = dags,
                               n_dags = length(dags),
                               name = name,
                               scm_type = scm_type,
                               n_nodes = n_nodes,
                               n_expected_neighbors = n_expected_neighbors,
                               n_expected_parents_y = n_expected_parents_y,
                               seed = seed,
                               true_dag_path = true_dag_path,
                               data_path = data_path,
                               n_observational = n_observational,
                               ...)
  saveRDS(cpdag_and_parameters, file_path_cpdag)

  # Save settings to log file
  settings_line <- sprintf(
    "%65s, seed: %2d, name: %12s, scm_type: %12s, true_dag_path: %65s, n_nodes: %3d, n_expected_neighbors: %3d, n_expected_parents_y: %3d",
    file_path_cpdag, seed, name, scm_type, true_dag_path, n_nodes, n_expected_neighbors, n_expected_parents_y
  )
  log_append_to_file(settings_line, paste0(dag_type_folder, '/log.txt'))
}



## Logging

log_to_shell <- function(msg) {
  time <- Sys.time()
  # Format DD-MM_YY hr:min:sec
  time <- format(time, format = "%d-%m-%y %H:%M:%S")
  print(paste0('[', time, '] ', msg))
}

log_to_shell_milliseconds <- function(msg) {
  time <- Sys.time()
  # Format DD-MM_YY hr:min:sec
  time <- format(time, format = "%d-%m-%y %H:%M:%OS3")
  print(paste0('[', time, '] ', msg))
}

log_append_to_file <- function(msg, file_name) {
  time <- Sys.time()
  # Format DD-MM_YY hr:min:sec
  time <- format(time, format = "%d-%m-%y %H:%M:%S")
  raw_append_to_file(paste0('[', time, '] ', msg), file_name)
}

raw_append_to_file <- function(msg, file_name) {
  # Create file if it doesn't exist
  if (!file.exists(file_name)) {
    file.create(file_name)
    log_to_shell(paste0('Log file not found. Created file ', file_name))
  }

  con <- file(file_name, open = "a")
  writeLines(msg, con)
  close(con)
}

