## Script to generate data for all previously generated SCM

source("R/scm/graph_functions.R")
source("R/scm/node_functions.R")
source("R/scm/binary_scm.R")
source("R/scm/additive_noise_scm.R")
source("R/scm/linear_gaussian_scm.R")

source("R/experiments/helper_functions.R")

n_samples_observational <- 10000
n_samples_to_explain <- 100

generate_data_for_scm <- function(file_path) {
  log_to_shell(paste0("Generating data for ", file_path, "..."))
  scm_and_parameters <- readRDS(file_path)
  scm <- scm_and_parameters$scm
  scm_type <- scm_and_parameters$scm_type
  n_nodes <- scm_and_parameters$n_nodes
  n_expected_neighbors <- scm_and_parameters$n_expected_neighbors
  n_expected_parents_y <- scm_and_parameters$n_expected_parents_y
  seed <- scm_and_parameters$seed


  data_observational <- generate_data(scm, n_samples_observational, seed)
  data_to_explain <- generate_data(scm, n_samples_to_explain, seed)

  log_to_shell(paste0("Saving data for ", file_path, "..."))
  save_data(data_observational, data_to_explain, scm_type, file_path, n_nodes, n_expected_neighbors, n_expected_parents_y, seed)
}

generate_data_for_each_scm <- function() {
  scm_base_folder <- "experiments/2_scms/"
  scm_type_folders <- list.dirs(scm_base_folder, recursive = FALSE)
  for (scm_type_folder in scm_type_folders) {
    n_nodes_folders <- list.dirs(scm_type_folder, recursive = FALSE)
    for (n_nodes_folder in n_nodes_folders) {
      n_nodes <- basename(n_nodes_folder)
      n_nodes <- as.integer(gsub("\\D", "", n_nodes))

      dag_type_folders <- list.dirs(n_nodes_folder, recursive = FALSE)
      for (dag_type_folder in dag_type_folders) {
        for (file_path in list.files(dag_type_folder, full.names = TRUE)) {
          if (grepl(".rds$", file_path)) {
            generate_data_for_scm(file_path)
          }
        }
      }
    }
  }
}

generate_data_for_each_scm()