#==============================================================================
# Vecchia for 1D synthetic function 
# Mark Risser
# Lawrence Berkeley National Laboratory
# May, 2025
#==============================================================================

set.seed(0)

# Setup / load data
library(GpGp)
y <- read.csv("1d_function/y_train_1d.csv", header = FALSE)$V1
ytest <- read.csv("1d_function/y_test_1d.csv", header = FALSE)$V1
x <- as.matrix(read.csv("1d_function/x_train_1d.csv", header = FALSE))
xtest <- as.matrix(read.csv("1d_function/x_test_1d.csv", header = FALSE))

# Training
# Note: below, 'fixed_parms = c(3,4)' means the Matern smoothness (10) and 
#       noise variance (0.01) are fixed and not trained.
prt <- proc.time()
fit <- fit_model(y = y, locs = x, m_seq = 30, start_parms = c(1, 0.1, 10, 0.01), fixed_parms = c(3,4), silent = TRUE)
print(paste0("Training time: ", (proc.time() - prt)[3], " seconds"))
print(summary(fit))
prt <- proc.time()
ypred <- predictions(fit = fit, locs_pred = xtest, X_pred = matrix(1, ncol=1, nrow=nrow(xtest)))
ypred_condsim <- cond_sim( fit, locs_pred = xtest, X_pred = matrix(1, ncol=1, nrow=nrow(xtest)), nsims = 200 )
ypred_se <- rep(NA, length(ypred))
for(j in 1:length(ypred)){
  ypred_se[j] <- sqrt( mean( (ypred_condsim[j,] - ypred[j] )^2 ) )
}
print(paste0("Prediction time for test points: ", (proc.time() - prt)[3], " seconds"))

# RMSE
print(paste0("RMSE: ", round(sqrt(mean((ypred - ytest)^2)), 4)))

# Write results to CSV
results_1d <- data.frame( x_test = as.numeric(xtest), y_test = ypred, y_standard_dev = ypred_se)
write.csv(results_1d, file = "vecchia_1d_results_final.csv", row.names = FALSE)