library(dplyr)
library(randomForest)
library(ggplot2)
library(MASS) 
library(rsample)
library(nnet)
outer_bounds <- list()
outer_plug_in_bounds <- list()
outer_prob_df<- list()
outer_influence_values <- list()
outer_influence_loss<- list()
outer_plug_in_loss<- list()
outer_mae_propensity <- list()
outer_mae_outcome <- list()
outer_mae_probs <- list()
outer_data<- list()
outer_alpha <- list()
outer_delta <- list()

#flag =0 allows for potential manipulation of estimated values
set.seed(10)
flag <- 0

# Define the number of samples
n <- 10000

# Simulate 6 V covariates for both groups (3 continuous, 3 discrete)
V_continuous <- matrix(rnorm(n * 3, mean = 1, sd = .5), ncol = 3)
V_discrete <- matrix(rbinom(n * 3, size = 1, prob = 0.5), ncol = 3)

# Combine continuous and discrete V covariates
V <- cbind(V_continuous, V_discrete)

# Define the coefficients for the linear combination
coeffs_W1 <- runif(6, -1, 1)
coeffs_W2 <- runif(6, -1, 1)
coeffs_W3 <- runif(6, -1, 1)

# Compute the probabilities for each binary variable
prob_W1 <- plogis(rowSums(V * coeffs_W1))
prob_W2 <- plogis(rowSums(V * coeffs_W2))
prob_W3 <- plogis(rowSums(V * coeffs_W3))

# Function to compute probability combinations
compute_probabilities <- function(p1, p2, p3) {
  c(
    prob_W_0_0_0 = (1 - p1) * (1 - p2) * (1 - p3),
    prob_W_0_0_1 = (1 - p1) * (1 - p2) * p3,
    prob_W_0_1_0 = (1 - p1) * p2 * (1 - p3),
    prob_W_0_1_1 = (1 - p1) * p2 * p3,
    prob_W_1_0_0 = p1 * (1 - p2) * (1 - p3),
    prob_W_1_0_1 = p1 * (1 - p2) * p3,
    prob_W_1_1_0 = p1 * p2 * (1 - p3),
    prob_W_1_1_1 = p1 * p2 * p3
  )
}

# Generate binary variables from probabilities
generate_binary_variable <- function(prob) {
  rbinom(length(prob), 1, prob)
}

# Generate W columns based on the probabilities
W_1 <- generate_binary_variable(prob_W1)
W_2 <- generate_binary_variable(prob_W2)
W_3 <- generate_binary_variable(prob_W3)

W <- cbind(W_1, W_2, W_3)

# Create a matrix to store the probabilities for each observation
prob_matrix <- t(sapply(1:n, function(i) {
  compute_probabilities(prob_W1[i], prob_W2[i], prob_W3[i])
}))

# Add probability columns to the data frame
prob_df <- data.frame(prob_matrix)
names(prob_df) <- c("prob_W_0_0_0", "prob_W_0_0_1", "prob_W_0_1_0", "prob_W_0_1_1",
                    "prob_W_1_0_0", "prob_W_1_0_1", "prob_W_1_1_0", "prob_W_1_1_1")

# Combine with the main data
data <- data.frame(W_1 = W_1, W_2 = W_2, W_3 = W_3)

# Simulate E and A
p_E1GivenV <- plogis(rowSums(V) * runif(n, -1, 1))
E <- rbinom(n, size = 1, prob = p_E1GivenV)
p_AGivenVE1 <- plogis(rowSums(V) * runif(n, -1, 1))
A <- rbinom(n, size = 1, prob = p_AGivenVE1)

# Assume the treatment effect size and covariates effect sizes
beta_V <- runif(6, 1, 3) # Random effect sizes for V covariates
beta_W <- runif(3, 1, 3) # Random effect sizes for W covariates

beta_A_coef <- runif(9, 0, 1.5)  # Adjust the range and size as needed
# Compute beta_A as a function of V and W covariates
compute_beta_A <- function(V, W) {
  # Example: Linear combination of V and W values
  (rowSums(V * beta_A_coef[1:6]) + rowSums(W * beta_A_coef[7:9]))
}

# Compute beta_A for each observation
beta_A <- compute_beta_A(V, W)


# Calculate the outcome variable Y with beta_A dependent on V and W
Y <- beta_A * A + rowSums(W * beta_W) + rowSums(V * beta_V) + rnorm(n)

# Create the dataset with all variables
data <- cbind(data.frame(A, E, Y), data.frame(W), data.frame(V))

# Renaming W and V columns
names(data)[(ncol(data) - 8):(ncol(data) - 6)] <- paste0("W_", 1:3)
names(data)[(ncol(data) - 5):(ncol(data) - 0)] <- paste0("V_", 1:6)

# Separate the experimental and observational data for clarity
experiment_data <- data[data$E == 1, ]
observational_data <- data[data$E == 0, ]

a <- min(experiment_data$Y, na.rm = TRUE)
b <- max(experiment_data$Y, na.rm = TRUE)



# Fit logistic regression models for mu_1(V) and mu_0(V) within the experimental group (E == 1)
lm_mu_1 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5 + V_6, data = experiment_data[experiment_data$A == 1, ])
lm_mu_0 <- lm(Y ~ V_1 + V_2 + V_3 + V_4 + V_5 + V_6, data = experiment_data[experiment_data$A == 0, ])

# Fit logistic regression models for the probabilities using only the V covariates
glm_p_A1_E1_given_V <- glm(as.factor(I(A * E)) ~ V_1 + V_2 + V_3 + V_4 + V_5 + V_6, data = data, family = binomial)
glm_p_A0_E1_given_V <- glm(as.factor(I((1 - A) * E)) ~ V_1 + V_2 + V_3 + V_4 + V_5 + V_6, data = data, family = binomial)
glm_p_E0_given_V <- glm(as.factor(I(1 - E)) ~ V_1 + V_2 + V_3 + V_4 + V_5 + V_6, data = data, family = binomial)

# PREDICTION PHASE (expectations)
data$mu_1 <- predict(lm_mu_1, data, type="response")
data$mu_0 <- predict(lm_mu_0, data, type="response")

# Predict the probabilities
data$prob_A1_E1 <- predict(glm_p_A1_E1_given_V, data, type = "response")
data$prob_A0_E1 <- predict(glm_p_A0_E1_given_V, data, type = "response")
data$prob_E0 <- predict(glm_p_E0_given_V, data, type = "response")

# Updated function to fit and predict with multinomial logistic regression
fit_predict_W_combinations_lr <- function(data, observational_data, w_vars, v_vars) {
  # Ensure W variables are factors
  observational_data[w_vars] <- lapply(observational_data[w_vars], factor)
  
  # Create a combined W factor representing all combinations directly
  observational_data$W_combined <- apply(observational_data[, w_vars], 1, function(x) paste(x, collapse = "_"))
  observational_data$W_combined <- as.factor(observational_data$W_combined)  # Ensure it's a factor
  
  # Fit a multinomial logistic regression model
  formula <- as.formula(paste("W_combined ~", paste(v_vars, collapse = "+")))
  model <- multinom(formula, data = observational_data)
  
  # Predict probabilities of each W combination
  prob_predictions <- predict(model, newdata = data, type = "probs")
  
  # Adding predicted probabilities to the original data
  combined_levels <- levels(observational_data$W_combined)
  for (level in combined_levels) {
    data[[paste0("prob_W_", level)]] <- prob_predictions[, level]
  }
  
  return(data)
}

# Then you call this function on your data
data <- fit_predict_W_combinations_lr(data, observational_data, c("W_1", "W_2", "W_3"), paste0("V_", 1:6))
data$beta_A <- beta_A


# Getting list of probability w types
prob_columns <- grep("prob_W_", names(data), value = TRUE)

n <- nrow(data[data$E == 1, ])
m <- nrow(data[data$E == 0, ])

indices <- which(data$E == 0)

# Precompute the column names based on 'prob_col'
prob_col_names <- paste("prob_W", data$W_1[indices], data$W_2[indices], data$W_3[indices], sep = "_")

# Initialize the prob_w column
data$prob_w <- NA

# Find indices where E == 0
indices <- which(data$E == 0)

for (i in seq_along(indices)) {
  idx <- indices[i]
  
  # Ensure the column name is valid and index exists
  if (i <= length(prob_col_names) && prob_col_names[i] %in% names(data)) {
    col_name <- prob_col_names[i]
    
    # Safely extract a single numeric value
    data$prob_w[idx] <- as.numeric(data[idx, col_name])
  } else {
    warning("Column does not exist or index out of bounds: ", prob_col_names[i])
  }
}

# Function to parse W values from column names and create g vector
create_g_vector <- function(data_row, col_name) {
  # Parse W values from col_name based on assumed format like 'prob_W_0_1_1'
  w_values <- as.numeric(strsplit(substr(col_name, 8, nchar(col_name)), "_")[[1]])
  
  # Extract V values from the row
  v_values <- as.numeric(data_row[grep("V_", names(data_row))])
  
  # Combine V and W values
  return(c(v_values, w_values))
}



# Measuring Distance between True Values and Estimated Values
E1_indices <- which(data$E == 1)
# Predict the probabilities
data$true_prob_A1_E1 <- p_AGivenVE1
data$true_prob_A0_E1 <- 1 - p_AGivenVE1
data$true_prob_E1_v <- p_E1GivenV 

# For rows where E == 1, calculate probabilities
data$true_prob_A1_E1[E1_indices] <- (p_AGivenVE1 * p_E1GivenV)[E1_indices]
data$true_prob_A0_E1[E1_indices] <- ((1 - p_AGivenVE1) * p_E1GivenV)[E1_indices]

data$true_prob_E0 <- 1 - p_E1GivenV 
data$true_mu_1 <- beta_A + rowSums(W * beta_W) + rowSums(V * beta_V)
data$true_mu_0 <- rowSums(W * beta_W) + rowSums(V * beta_V)

formatted_combinations <- c("prob_W_0_0_0", "prob_W_0_0_1", "prob_W_0_1_0", "prob_W_0_1_1",
                            "prob_W_1_0_0", "prob_W_1_0_1", "prob_W_1_1_0", "prob_W_1_1_1")
original_data <- data

mae <- function(true_values, estimated_values) {
  mean(abs(true_values - estimated_values), na.rm = TRUE)
}



num_v_w_vars <- length(grep("V_", names(data))) + 3  # Adjust number of W vars as needed
#flag=1 is if you are using ground truth data



# alpha = runif(1, min = 0.1, max = 1)
# s <- sample(c(-1, 1), 1)
# data$mu_0 <- data$mu_0  +  mean(data$mu_0)*rnorm(n+m, mean = s*(n+m)^(-alpha), sd = (n+m)^(-alpha))
# data$mu_0 <- data$mu_1  +  mean(data$mu_1)*rnorm(n+m, mean = s*(n+m)^(-alpha), sd = (n+m)^(-alpha))
# data$prob_A1_E1 <- pmax(.005,data$prob_A1_E1 +  mean(data$prob_A1_E1)*rnorm(n+m, mean = s*(n+m)^(-alpha), sd = (n+m)^(-alpha)))
# data$prob_A0_E1 <- pmax(.005,data$prob_A0_E1 +  mean(data$prob_A1_E1)*rnorm(n+m, mean = s*(n+m)^(-alpha), sd = (n+m)^(-alpha)))
# data$prob_E0 <- pmax(.005,data$prob_E0+  mean(data$prob_A1_E1)*rnorm(n+m, mean = s*(n+m)^(-alpha), sd = (n+m)^(-alpha)))

# Calculate MAE for each of the TO-DO tasks
mae_prob_combinations <- sapply(formatted_combinations, function(col) {
  mae(data[[col]], prob_df[[col]])
})

mae_prob_A1_E1 <- mae(data$true_prob_A1_E1[E1_indices], data$prob_A1_E1[E1_indices])
mae_prob_A0_E1 <- mae(data$true_prob_A0_E1[E1_indices], data$prob_A0_E1[E1_indices])
mae_prob_E0 <- mae(data$true_prob_E0, data$prob_E0)
mae_mu_1 <- mae(data$true_mu_1, data$mu_1)
mae_mu_0 <- mae(data$true_mu_0, data$mu_0)

mae_propensity <- mae_prob_A1_E1 + mae_prob_A0_E1 + mae_prob_E0
mae_outcome <- mae_mu_1 + mae_mu_0 
mae_probs <- sum(mae_prob_combinations)

for (col_name in prob_columns) {
  data[[col_name]] <- pmax(data[[col_name]], .01)
}
setting_value <- data
delta_max1 = b-a - mean(data$mu_1-data$mu_0)
delta_max = delta_max1

delta_range <- seq(delta_max, 0, length.out = 10)
for (delta in delta_range){
  data <- setting_value
  bounds <- list()
  bounds_plug_in_model <- list()
  for (i in 1:4) {
    # i =1 means we are doing a lower-bound and i=2 means we are doing an upper bound
    if (i == 1 || i == 3) {
      width <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 +delta)
      }
      width2 <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 -delta)
      }

      
      f <- function(b, a, mu1, mu0, tau_d) {
        tau_value <- tau(b, a, mu1, mu0, tau_d) -width2(b, a, mu1, mu0, tau_d)
        return(as.numeric(tau_value >= 0))
      }
      
      tau_n <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d))
      }
      
      tau <- function(b, a, mu1, mu0, tau_d) {
        return(as.numeric((mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d)) / tau_d))
      }
    } else {
      width <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 -delta)
      }
      width2 <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 +delta)
      }
      
      f <- function(b, a, mu1, mu0, tau_d) {
        tau_value <- tau(b, a, mu1, mu0, tau_d) -width2(b, a, mu1, mu0, tau_d)
        return(as.numeric(tau_value <= 0))
      }
      
      tau_n <- function(b, a, mu1, mu0, tau_d) {
        return(mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d))
      }
      
      tau <- function(b, a, mu1, mu0, tau_d) {
        return(as.numeric((mu1 - mu0 - (width(b, a, mu1, mu0, tau_d)) * (1 - tau_d)) / tau_d))
      }
    }
    
    
    
    if (i == 3 || i == 4) {  # These are the true values
      E1_indices <- which(data$E == 1)
      # Predict the probabilities
      data$prob_A1_E1 <- p_AGivenVE1
      data$prob_A0_E1 <- 1 - p_AGivenVE1
      data$prob_E1_v <- p_E1GivenV 
      
      # For rows where E == 1, calculate probabilities
      data$prob_A1_E1[E1_indices] <- (p_AGivenVE1 * p_E1GivenV)[E1_indices]
      data$prob_A0_E1[E1_indices] <- ((1 - p_AGivenVE1) * p_E1GivenV)[E1_indices]
      
      data$prob_E0 <- 1 - p_E1GivenV 
      data$mu_1 <- beta_A + rowSums(W * beta_W) + rowSums(V * beta_V)
      data$mu_0 <- rowSums(W * beta_W) + rowSums(V * beta_V)
      
      formatted_combinations <- c("prob_W_0_0_0", "prob_W_0_0_1", "prob_W_0_1_0", "prob_W_0_1_1",
                                  "prob_W_1_0_0", "prob_W_1_0_1", "prob_W_1_1_0", "prob_W_1_1_1")
      data[, formatted_combinations] <- prob_df
    }
    
    # Initialize a zero vector of the correct length to accumulate results
    E1A1_sum <- numeric(num_v_w_vars)
    
    # Apply function across each observation and accumulate results
    apply(data[data$E == 1 & data$A == 1, ], 1, function(data_row) {
      temp_results <- numeric(num_v_w_vars)
      # Loop over each probability column
      for (col_name in prob_columns) {
        g_vector <- create_g_vector(data_row, col_name)
        f_value <- f(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])
        current <- (data_row["E"] * data_row["A"] / data_row["prob_A1_E1"]) * (data_row["Y"] - data_row["mu_1"]) * f_value * g_vector
        temp_results <- temp_results + current
      }
      # Accumulate the temporary results into the final vector
      E1A1_sum <<- E1A1_sum + temp_results
    })
    
    # EXPERIMENTAL DATA (E=1), A=0
    E1A0_sum <- numeric(num_v_w_vars)
    apply(data[data$E == 1 & data$A == 0, ], 1, function(data_row) {
      temp_results <- numeric(num_v_w_vars)
      # Loop over each probability column
      for (col_name in prob_columns) {
        g_vector <- create_g_vector(data_row, col_name)
        f_value <- f(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])
        current <- (data_row["E"] * (1 - data_row["A"]) / data_row["prob_A0_E1"]) * (data_row["Y"] - data_row["mu_0"]) * f_value * g_vector
        temp_results <- temp_results + current
      }
      # Accumulate the temporary results into the final vector
      E1A0_sum <<- E1A0_sum + temp_results
    })
    
    # Observational Data (E=0)
    E0_P1 <- numeric(num_v_w_vars)
    
    # Apply function across each observation where E == 0
    apply(data[data$E == 0, ], 1, function(data_row) {
      prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
      prob_W_value <- data_row[prob_col_name]  # Extract the probability value associated with the W configuration
      g_vector <- create_g_vector(data_row, prob_col_name)
      result_contributions <- ((width(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])) * (1 - data_row["E"]) / data_row["prob_E0"]) * g_vector * f(b, a, data_row["mu_1"], data_row["mu_0"], prob_W_value)
      E0_P1 <<- E0_P1 + result_contributions
    })
    
    E0_P2 <- numeric(num_v_w_vars)
    
    # Apply function across each observation and accumulate results
    apply(data[data$E == 0, ], 1, function(data_row) {
      temp_results <- numeric(num_v_w_vars)
      # Loop over each probability column
      for (col_name in prob_columns) {
        g_vector <- create_g_vector(data_row, col_name)
        f_value <- f(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])
        current <- ((width(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])) * (1 - data_row["E"]) / data_row["prob_E0"]) * f_value * g_vector * data_row[col_name]
        temp_results <- temp_results + current
      }
      # Accumulate the temporary results into the final vector
      E0_P2 <<- E0_P2 + temp_results
    })
    
    phi_21 <- numeric(num_v_w_vars)
    
    # Apply function across each observation where E == 0
    apply(data[data$E == 0, ], 1, function(data_row) {
      prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
      prob_W_value <- data_row[prob_col_name]  # Extract the probability value associated with the W configuration
      g_vector <- create_g_vector(data_row, prob_col_name)
      t_v <- tau(b, a, data_row["mu_1"], data_row["mu_0"], prob_W_value)
      result_contributions <- ((1 - data_row["E"]) / data_row["prob_E0"]) * g_vector * f(b, a, data_row["mu_1"], data_row["mu_0"], prob_W_value) * t_v
      phi_21 <<- phi_21 + result_contributions
    })
    
    phi_22 <- numeric(num_v_w_vars)
    apply(data[data$E == 0, ], 1, function(data_row) {
      temp_results <- numeric(num_v_w_vars)
      # Loop over each probability column
      for (col_name in prob_columns) {
        if (data_row[col_name] == 0) {
          next  # Skip this column if the divisor would be zero
        }
        g_vector <- create_g_vector(data_row, col_name)
        f_value <- f(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])
        val_t <- tau_n(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])
        current <- ((1 - data_row["E"]) / data_row["prob_E0"]) * f_value * g_vector * val_t
        temp_results <- temp_results + current
      }
      # Accumulate the temporary results into the final vector
      phi_22 <<- phi_22 + temp_results
    })
    
    extra <- numeric(num_v_w_vars)
    
    # Apply function across each observation where E == 0
    apply(data[data$E == 0, ], 1, function(data_row) {
      prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
      if (data_row[prob_col_name] == 0) {
        next  # Skip this column if the divisor would be zero
      }
      prob_W_value <- data_row[prob_col_name]  # Extract the probability value associated with the W configuration
      g_vector <- create_g_vector(data_row, prob_col_name)
      t <- tau(b, a, data_row["mu_1"], data_row["mu_0"], prob_W_value)
      f_val <- f(b, a, data_row["mu_1"], data_row["mu_0"], prob_W_value)
      current <- g_vector * (t * f_val - (width2(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name])) * f_val +width2(b, a, data_row["mu_1"], data_row["mu_0"], data_row[col_name]))
      extra <<- extra + current
    })
    
    denom <- numeric(num_v_w_vars)
    avg_g <- numeric(num_v_w_vars)
    
    apply(data[data$E == 0, ], 1, function(data_row) {
      prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
      g_vector <- create_g_vector(data_row, prob_col_name)
      current <- g_vector %*% t(g_vector)
      denom <<- denom + current
      avg_g <<- avg_g + g_vector
    })
    
    total_sum <- E1A1_sum - E1A0_sum + E0_P1 - E0_P2 - phi_21 + phi_22 + ((n + m) / m) * extra
    total_sum <- ginv(denom / m) %*% (total_sum / (n + m))
    total_sum_plug <- ginv(denom / m) %*% (extra / m)
    bounds <- append(bounds, list(total_sum))
    bounds_plug_in_model <- append(bounds_plug_in_model, list(total_sum_plug))
  }
  
  save <- 1
  if (save == 1) {
    true_plug_in_bounds <- bounds_plug_in_model[3:4]
  }
  #print(bounds_plug_in_model[1:2])
  #print(bounds_plug_in_model[3:4])
  E0_indices <- which(data$E == 0)
  plug_in_general_bounds <- list()
  
  plug_in_general <- with(data[data$E == 0, ], {
    low <- pmax((mu_1 - mu_0 - (b - a) * (1 - prob_w)) / prob_w, a - b)
    up <- pmin((mu_1 - mu_0 - (a - b) * (1 - prob_w)) / prob_w, b - a)
    plug_in_general_bounds <<- append(plug_in_general_bounds, list(low, up))
  })
  data$plug_in_general_lower <- NA
  data$plug_in_general_upper <- NA
  data$plug_in_general_lower[E0_indices] <- plug_in_general_bounds[[1]]
  data$plug_in_general_upper[E0_indices] <- plug_in_general_bounds[[2]]
  data$true_lower <- NA
  data$true_upper <- NA
  data$influence_lower <- NA
  data$influence_upper <- NA
  data$plug_in_model_lower <- NA
  data$plug_in_model_upper <- NA
  data$coverage_general <- NA
  data$coverage_true <- NA
  data$coverage_influence <- NA
  data$coverage_plug_in <- NA
  
  coverage <- list()
  influence_values <- list()
  plug_models <- list()
  influence_loss <- list()
  plug_in_loss <- list()
  
  
  compute_influence <- function(data_row) {
    prob_col_name <- paste("prob_W", paste(data_row["W_1"], data_row["W_2"], data_row["W_3"], sep = "_"), sep = "_")
    g_vector <- create_g_vector(data_row, prob_col_name)
    # Compute current influence
    current1 <- sum(g_vector * bounds[[1]])
    current2 <- sum(g_vector * bounds[[2]])
    current3 <- sum(g_vector * bounds_plug_in_model[[1]])
    current4 <- sum(g_vector * bounds_plug_in_model[[2]])
    current5 <- sum(g_vector * true_plug_in_bounds[[1]])
    current6 <- sum(g_vector * true_plug_in_bounds[[2]])
    data_row["true_lower"] <- current5
    data_row["true_upper"] <- current6
    data_row["influence_lower"] <- current1
    data_row["influence_upper"] <- current2
    data_row["plug_in_model_lower"] <- current3
    data_row["plug_in_model_upper"] <- current4
    data_row["coverage_general"] <- as.numeric(data_row["plug_in_general_lower"] <= data_row["beta_A"] & data_row["beta_A"] <= data_row["plug_in_general_upper"])
    data_row["coverage_true"] <- as.numeric(current5 <= data_row["beta_A"] & data_row["beta_A"] <= current6)
    data_row["coverage_influence"] <- as.numeric(current1 <= data_row["beta_A"] & data_row["beta_A"] <= current2)
    data_row["coverage_plug_in"] <- as.numeric(current3 <= data_row["beta_A"] & data_row["beta_A"] <= current4)
    influence_loss <<- append(influence_loss, abs(current5 - current1) + abs(current6 - current2))
    plug_in_loss <<- append(plug_in_loss, abs(current5 - current3) + abs(current6 - current4))
    influence_values <<- append(influence_values, list(c(current1, current2)))
    plug_models <<- append(plug_models, list(c(current3, current4)))
    return(data_row)
  }
  # Apply function across each observation where E == 0
  data[data$E == 0, ] <- t(apply(data[data$E == 0, ], 1, compute_influence))
  
  
  
  
  # Convert the list to a numeric vector
  influence_vector <- unlist(influence_values)
  plug_model_vector <- unlist(plug_models)
  influence_loss <- unlist(influence_loss)
  plug_in_loss <- unlist(plug_in_loss)
  
  print(mean(influence_loss))
  print(mean(plug_in_loss))
  
  
 
  
  
  outer_influence_values <- append(outer_influence_values, list(influence_vector))
  outer_plug_in_bounds <- append(outer_plug_in_bounds, list(plug_model_vector))
  outer_prob_df <- append(outer_prob_df, list(prob_df))
  outer_influence_loss <- append(outer_influence_loss, list(mean(influence_loss)))
  outer_plug_in_loss <- append(outer_plug_in_loss, list(mean(plug_in_loss)))
  outer_mae_propensity <- append(outer_mae_propensity, list(mae_propensity))
  outer_mae_outcome <- append(outer_mae_outcome, list(mae_outcome))
  outer_mae_probs <- append(outer_mae_probs, list(mae_probs))
  outer_data <- append(outer_data, list(data))
  outer_alpha <- append(outer_alpha, list(alpha))
  outer_delta <- append(outer_delta, list(delta))
}
