library(dplyr)
library(randomForest)
library(ggplot2)
library(MASS) 
library(rsample)
#install.packages("medicaldata")
library(medicaldata)

library(dplyr)
library(randomForest)
library(ggplot2)
library(MASS) 
library(rsample)
library(nnet)


outer_data<- list()
outer_delta <- list()


set.seed(123)

data(licorice_gargle, package = "medicaldata")
licorice_gargle <- licorice_gargle[-c(113,123), ]
licorice_gargle <- licorice_gargle %>% rename(A = treat)
print(names(licorice_gargle))

# Define the variables to be used as W's and V's
binary_vars <- c( "extubation_cough")
w_vars <- sample(binary_vars, 1) 
v_vars <- setdiff(c( "preOp_calcBMI", "preOp_age", "preOp_pain", "preOp_mallampati","preOp_asa","preOp_smoking"), w_vars)  # Remaining variables as V
print(v_vars)

# Convert W variables to factors if necessary
#licorice_gargle[w_vars] <- lapply(licorice_gargle[w_vars], as.factor)

# Select one main outcome variable (e.g., 'pacu30min_cough')
outcome_vars <- c("extubation_cough", "pacu30min_cough", "pacu30min_throatPain", "pacu30min_swallowPain",
                  "pacu90min_cough", "pacu90min_throatPain", "postOp4hour_cough", "postOp4hour_throatPain",
                  "pod1am_cough", "pod1am_throatPain")

# Select one main outcome variable (e.g., 'pacu30min_cough') and rename it to 'Y'
main_outcome <- "pacu30min_swallowPain"  # Choose one main outcome variable
names(licorice_gargle)[names(licorice_gargle) == main_outcome] <- "Y"

# Select desired columns
desired_columns <- c(w_vars, v_vars, "A", "Y")
licorice_gargle <- licorice_gargle[, desired_columns]

# Randomly assign E=1 (RCT) or E=0 (observational) to each row
licorice_gargle$E <- sample(c(0, 1), nrow(licorice_gargle), replace = TRUE)

# Create the combined data with the 'E' column added
data <- licorice_gargle

# Define the range of the outcome variable 'Y'
a <- min(licorice_gargle$Y[licorice_gargle$E == 1], na.rm = TRUE)
b <- max(licorice_gargle$Y[licorice_gargle$E == 1], na.rm = TRUE)

names(data)[1:1] <- paste0("W_", 1:1)
names(data)[2:7] <- paste0("V_", 1:6)

experiment_data <- data[data$E == 1, ]
observational_data <- data[data$E == 0, ]



# Fit the models
lm_mu_11 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5  + W_1 , data =  data[data$A == 1, ])
lm_mu_00 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5 + W_1 , data = data[data$A == 0, ])

# Predict the response
data$beta_A <- predict(lm_mu_11, newdata = data, type = "response") - predict(lm_mu_00, newdata = data, type = "response")





# Fit logistic regression models for mu_1(V) and mu_0(V) within the experimental group (E == 1)
lm_mu_1 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5, data = experiment_data[experiment_data$A == 1, ])
lm_mu_0 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5, data = experiment_data[experiment_data$A == 0, ])

lm_mu_11 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5+W_1, data = data[data$A == 1, ])
lm_mu_00 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5+W_1, data = data[data$A == 0, ])

data$beta_A <-  predict(lm_mu_11, data, type="response") - predict(lm_mu_00, data, type="response")

# Fit logistic regression models for the probabilities using only the V covariates
glm_p_A1_E1_given_V <- glm(as.factor(I(A * E)) ~ V_1 + V_2 + V_3 + V_4 + V_5, data = data, family = binomial)
glm_p_A0_E1_given_V <- glm(as.factor(I((1 - A) * E)) ~ V_1 + V_2 + V_3 + V_4 + V_5, data = data, family = binomial)
glm_p_E0_given_V <- glm(as.factor(I(1 - E)) ~ V_1 + V_2 + V_3 + V_4 + V_5, data = data, family = binomial)

# PREDICTION PHASE (expectations)
data$mu_1 <- predict(lm_mu_1, data, type="response")
data$mu_0 <- predict(lm_mu_0, data, type="response")

# Predict the probabilities
data$prob_A1_E1 <- predict(glm_p_A1_E1_given_V, data, type = "response")
data$prob_A0_E1 <- predict(glm_p_A0_E1_given_V, data, type = "response")
data$prob_E0 <- predict(glm_p_E0_given_V, data, type = "response")


# Updated function to fit and predict with multinomial logistic regression for one W variable
fit_predict_W_combinations_lr <- function(data, observational_data, w_var, v_vars) {
  # Ensure W variable is a factor
  observational_data[[w_var]] <- factor(observational_data[[w_var]])
  
  # Fit a multinomial logistic regression model
  formula <- as.formula(paste(w_var, "~", paste(v_vars, collapse = "+")))
  model <- multinom(formula, data = observational_data)
  
  # Predict probabilities of each W combination
  prob_predictions <- predict(model, newdata = data, type = "probs")
  
  # Adding predicted probabilities to the original data
  levels_w <- levels(observational_data[[w_var]])
  for (level in levels_w) {
    data[[paste0("prob_W_", level)]] <- prob_predictions[, level]
  }
  
  return(data)
}

# Then you call this function on your data
data <- fit_predict_W_combinations_lr(data, observational_data, "W_1", paste0("V_", 1:6))

# formatted_combinations <- c("prob_W_0_0_0", "prob_W_0_0_1", "prob_W_0_1_0", "prob_W_0_1_1",
#                             "prob_W_1_0_0", "prob_W_1_0_1", "prob_W_1_1_0", "prob_W_1_1_1")
# data[, formatted_combinations] <- prob_df

# Getting list of probability w types
prob_columns <- grep("prob_W_", names(data), value = TRUE)

n <- nrow(data[data$E == 1, ])
m <- nrow(data[data$E == 0, ])

indices <- which(data$E == 0)

# Precompute the column names based on 'prob_col'
prob_col_names <- paste("prob_W", data$W_1[indices], sep = "_")
print(prob_col_names)
# Initialize the prob_w column
data$prob_w <- NA

# Find indices where E == 0
indices <- which(data$E == 0)

for (i in seq_along(indices)) {
  idx <- indices[i]
  
  # Ensure the column name is valid and index exists
  if (i <= length(prob_col_names) && prob_col_names[i] %in% names(data)) {
    col_name <- prob_col_names[i]
    
    # Safely extract a single numeric value
    data$prob_w[idx] <- as.numeric(data[idx, col_name])
  } else {
    warning("Column does not exist or index out of bounds: ", prob_col_names[i])
  }
}

# Function to parse W values from column names and create g vector
create_g_vector <- function(data_row, col_name) {
  # Parse W values from col_name based on assumed format like 'prob_W_0_1_1'
  w_values <- as.numeric(strsplit(substr(col_name, 8, nchar(col_name)), "_")[[1]])
  
  # Extract V values from the row
  v_values <- as.numeric(data_row[grep("V_", names(data_row))])
  
  # Combine V and W values
  return(c(v_values, w_values))
}




E1_indices <- which(data$E == 1)



num_v_w_vars <- 7  # Adjust number of W vars as needed
#flag=1 is if you are using ground truth data



for (col_name in prob_columns) {
  data[[col_name]] <- pmax(data[[col_name]], .01)
}
data$mu_1 <- as.numeric(data$mu_1)
data$mu_0 <- as.numeric(data$mu_0)

print(mean(data$mu_1-data$mu_0))

true_delta = max(as.numeric(data$beta_A)-(as.numeric(data$mu_1)-as.numeric(data$mu_0)))

setting_value <- data
delta_max1 = b-a - mean(data$mu_1-data$mu_0)
delta_max = delta_max1

delta_range <- seq(delta_max, 0, length.out = 10)
for (delta in delta_range){
  data <- setting_value
  bounds <- list()
  bounds_plug_in_model <- list()
  for (i in 1:2) {
  if (i == 1) {
    width <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 +delta)
    }
    width2 <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 -delta)
    }
    
    
    f <- function(b, a, mu1, mu0, tau_d) {
      tau_value <- tau(b, a, mu1, mu0, tau_d) -width2(b, a, mu1, mu0, tau_d)
      return(as.numeric(tau_value >= 0))
    }
    
    tau_n <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d))
    }
    
    tau <- function(b, a, mu1, mu0, tau_d) {
      return(as.numeric((mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d)) / tau_d))
    }
  } else {
    width <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 -delta)
    }
    width2 <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 +delta)
    }
    
    f <- function(b, a, mu1, mu0, tau_d) {
      tau_value <- tau(b, a, mu1, mu0, tau_d) -width2(b, a, mu1, mu0, tau_d)
      return(as.numeric(tau_value <= 0))
    }
    
    tau_n <- function(b, a, mu1, mu0, tau_d) {
      return(mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d))
    }
    
    tau <- function(b, a, mu1, mu0, tau_d) {
      return(as.numeric((mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d)) / tau_d))
    }
  }
  
  print(prob_columns)
  
  
  # # Initialize a zero vector of the correct length to accumulate results
  # E1A1_sum <- numeric(num_v_w_vars)
  # 
  # # Apply function across each observation and accumulate results
  # apply(data[data$E == 1 & data$A == 1, ], 1, function(data_row) {
  #   temp_results <- numeric(num_v_w_vars)
  #   # Loop over each probability column
  #   for (col_name in prob_columns) {
  #     data_row <- as.numeric(data_row)
  #     g_vector <- create_g_vector(data_row, col_name)
  #     print(g_vector)
  #     f_value <- f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), as.numeric(data_row[col_name]))
  #     current <- (as.numeric(data_row["E"]) * as.numeric(data_row["A"]) / as.numeric(data_row["prob_A1_E1"])) * (as.numeric(data_row["Y"]) - as.numeric(data_row["mu_1"])) * f_value * g_vector
  #     temp_results <- temp_results + current
  #     print(temp_results)
  #   }
  #   # Accumulate the temporary results into the final vector
  #   E1A1_sum <<- E1A1_sum + temp_results
  # })
  # 
  # # EXPERIMENTAL DATA (E=1), A=0
  # E1A0_sum <- numeric(num_v_w_vars)
  # apply(data[data$E == 1 & data$A == 0, ], 1, function(data_row) {
  #   temp_results <- numeric(num_v_w_vars)
  #   # Loop over each probability column
  #   for (col_name in prob_columns) {
  #     g_vector <- create_g_vector(data_row, col_name)
  #     f_value <- f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), as.numeric(data_row[col_name]))
  #     current <- (as.numeric(data_row["E"]) * (1 - as.numeric(data_row["A"])) / as.numeric(as.numeric(data_row["prob_A0_E1"]))) * (as.numeric(data_row["Y"]) - as.numeric(data_row["mu_0"])) * f_value * g_vector
  #     temp_results <- temp_results + current
  #   }
  #   # Accumulate the temporary results into the final vector
  #   E1A0_sum <<- E1A0_sum + temp_results
  # })
  # 
  # # Observational Data (E=0)
  # E0_P1 <- numeric(num_v_w_vars)
  # 
  # # Apply function across each observation where E == 0
  # apply(data[data$E == 0, ], 1, function(data_row) {
  #   prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
  #   prob_W_value <- data_row[prob_col_name]  # Extract the probability value associated with the W configuration
  #   g_vector <- create_g_vector(data_row, prob_col_name)
  #   result_contributions <- ((width) * (1 - as.numeric(data_row["E"])) / as.numeric(data_row["prob_E0"])) * g_vector * f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value)
  #   E0_P1 <<- E0_P1 + result_contributions
  # })
  # 
  # E0_P2 <- numeric(num_v_w_vars)
  # 
  # # Apply function across each observation and accumulate results
  # apply(data[data$E == 0, ], 1, function(data_row) {
  #   temp_results <- numeric(num_v_w_vars)
  #   # Loop over each probability column
  #   for (col_name in prob_columns) {
  #     g_vector <- create_g_vector(data_row, col_name)
  #     f_value <- f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), as.numeric(data_row[col_name]))
  #     current <- ((width) * (1 - as.numeric(data_row["E"])) / as.numeric(data_row["prob_E0"])) * f_value * g_vector * as.numeric(data_row[col_name])
  #     temp_results <- temp_results + current
  #   }
  #   # Accumulate the temporary results into the final vector
  #   E0_P2 <<- E0_P2 + temp_results
  # })
  # 
  # phi_21 <- numeric(num_v_w_vars)
  # 
  # # Apply function across each observation where E == 0
  # apply(data[data$E == 0, ], 1, function(data_row) {
  #   prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
  #   prob_W_value <- data_row[prob_col_name]  # Extract the probability value associated with the W configuration
  #   g_vector <- create_g_vector(data_row, prob_col_name)
  #   t_v <- tau(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value)
  #   result_contributions <- ((1 - as.numeric(data_row["E"])) / as.numeric(data_row["prob_E0"])) * g_vector * f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value) * t_v
  #   phi_21 <<- phi_21 + result_contributions
  # })
  # 
  # phi_22 <- numeric(num_v_w_vars)
  # apply(data[data$E == 0, ], 1, function(data_row) {
  #   data_row["mu_1"] <- as.numeric(data_row["mu_1"])
  #   data_row["mu_0"] <- as.numeric(data_row["mu_0"])
  #   as.numeric(data_row["prob_A1_E1"]) <- as.numeric(as.numeric(data_row["prob_A1_E1"]))
  #   as.numeric(as.numeric(data_row["prob_A0_E1"])) <- as.numeric(as.numeric(as.numeric(data_row["prob_A0_E1"])))
  #   as.numeric(data_row["prob_E0"]) <- as.numeric(as.numeric(data_row["prob_E0"]))
  #   as.numeric(data_row["Y"]) <- as.numeric(as.numeric(data_row["Y"]))
  #   as.numeric(data_row["E"]) <- as.numeric(as.numeric(data_row["E"]))
  #   print(as.numeric(data_row["E"]))
  #   as.numeric(data_row["A"]) <- as.numeric(as.numeric(data_row["A"]))
  #   temp_results <- numeric(num_v_w_vars)
  #   # Loop over each probability column
  #   for (col_name in prob_columns) {
  #     if (as.numeric(data_row[col_name]) == 0) {
  #       next  # Skip this column if the divisor would be zero
  #     }
  #     g_vector <- create_g_vector(data_row, col_name)
  #     f_value <- f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), as.numeric(data_row[col_name]))
  #     val_t <- tau_n(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), as.numeric(data_row[col_name]))
  #     current <- ((1 - as.numeric(as.numeric(data_row["E"]))) / as.numeric(data_row["prob_E0"])) * f_value * g_vector * val_t
  #     temp_results <- temp_results + current
  #   }
  #   # Accumulate the temporary results into the final vector
  #   phi_22 <<- phi_22 + temp_results
  # })
  
  extra <- numeric(num_v_w_vars)
  
  # Apply function across each observation where E == 0
  apply(data[data$E == 0, ], 1, function(data_row) {
    data_row["mu_1"] <- as.numeric(data_row["mu_1"])
    data_row["mu_0"] <- as.numeric(data_row["mu_0"])
    data_row["prob_A1_E1"] <- as.numeric(as.numeric(data_row["prob_A1_E1"]))
    data_row["prob_A0_E1"] <- as.numeric(as.numeric(as.numeric(data_row["prob_A0_E1"])))
    data_row["prob_E0"] <- as.numeric(as.numeric(data_row["prob_E0"]))
    data_row["Y"] <- as.numeric(as.numeric(data_row["Y"]))
    #data_row <- as.numeric(data_row)
    temp_results <- numeric(num_v_w_vars)
    print(data_row["W_1"])
    prob_col_name <- paste("prob_W", paste(data_row["W_1"], sep = "_"), sep = "_")
    print(prob_col_name)
    if (as.numeric(data_row[prob_col_name]) == 0) {
      next  # Skip this column if the divisor would be zero
    }
    prob_W_value <-as.numeric(data_row[prob_col_name] )  # Extract the probability value associated with the W configuration
    g_vector <- create_g_vector(data_row, prob_col_name)
    t <- tau(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value)
    f_val <- f(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value)
    current <- g_vector * (t * f_val - (width2(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value)) * f_val + width2(b, a, as.numeric(data_row["mu_1"]), as.numeric(data_row["mu_0"]), prob_W_value))
    extra <<- extra + current
  })
  
  denom <- numeric(num_v_w_vars)
  avg_g <- numeric(num_v_w_vars)
  
  apply(data[data$E == 0, ], 1, function(data_row) {
    prob_col_name <- paste("prob_W", paste(data_row["W_1"], sep = "_"), sep = "_")
    g_vector <- create_g_vector(data_row, prob_col_name)
    current <- g_vector %*% t(g_vector)
    denom <<- denom + current
    avg_g <<- avg_g + g_vector
  })
  
  #total_sum <- E1A1_sum - E1A0_sum + E0_P1 - E0_P2 - phi_21 + phi_22 + ((n + m) / m) * extra
  #total_sum <- ginv(denom / m) %*% (total_sum / (n + m))
  total_sum_plug <- ginv(denom / m) %*% (extra / m)
  bounds <- append(bounds_plug_in_model, list(total_sum_plug))
  bounds_plug_in_model <- append(bounds_plug_in_model, list(total_sum_plug))
  }
  
  
  #print(bounds_plug_in_model[1:2])
  #print(bounds_plug_in_model[3:4])
  E0_indices <- which(data$E == 0)
  
  
  
  data$true_lower <- NA
  data$true_upper <- NA
  data$influence_lower <- NA
  data$influence_upper <- NA
  data$plug_in_model_lower <- NA
  data$plug_in_model_upper <- NA
  data$coverage_general <- NA
  data$coverage_true <- NA
  data$coverage_influence <- NA
  data$coverage_plug_in <- NA
  
  coverage <- list()
  influence_values <- list()
  plug_models <- list()
  influence_loss <- list()
  plug_in_loss <- list()
  print(bounds[[1]])
  # Function to compute influence values
  compute_influence <- function(data_row) {
  prob_col_name <- paste("prob_W", paste(data_row["W_1"], sep = "_"), sep = "_")
  g_vector <- create_g_vector(data_row, prob_col_name)
  print(g_vector)
  # Compute current influence
  current1 <- sum(as.numeric(g_vector) * bounds[[1]])
  current2 <- sum(as.numeric(g_vector) * bounds[[2]])
  current3 <- sum(as.numeric(g_vector) * bounds_plug_in_model[[1]])
  current4 <- sum(as.numeric(g_vector) * bounds_plug_in_model[[2]])
  
  data_row["influence_lower"] <- current1
  data_row["influence_upper"] <- current2 
  data_row["plug_in_model_lower"] <- current3
  data_row["plug_in_model_upper"] <- current4
  data_row["coverage_influence"] <- as.numeric(current1 <= as.numeric(data_row["beta_A"]) & data_row["beta_A"] <= current2)
  data_row["coverage_plug_in"] <- as.numeric(current3 <= as.numeric(data_row["beta_A"]) & data_row["beta_A"] <= current4)
  
  #influence_loss <<- append(influence_loss, abs(current5 - current1) + abs(current6 - current2))
  #plug_in_loss <<- append(plug_in_loss, abs(current5 - current3) + abs(current6 - current4))
  influence_values <<- append(influence_values, list(c(current1, current2)))
  plug_models <<- append(plug_models, list(c(current3, current4)))
  return(data_row)
  }
  
  data[data$E == 0, ] <- t(apply(data[data$E == 0, ], 1, compute_influence))
  
  
  # Convert the list to a numeric vector
  influence_vector <- unlist(influence_values)
  plug_model_vector <- unlist(plug_models)
  
  

  outer_data <- append(outer_data, list(data))
  outer_delta <- append(outer_delta, list(delta))
  
  
  
}