library(xgboost)
library(data.table)
# Root directory that holds the data splits and the results folder.
path <- "C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/"

# Airpassenger -----
# For each of the 10 splits: fit an XGBoost regressor on the training split,
# predict on the matching test split, and store c(RMSE, MAD of residuals).
lst <- list()
for (k in 1:10) {
  X_train <- as.matrix(fread(paste0(path, "data_split/Airpassenger/X_train", k, ".csv")))
  y_train <- as.matrix(fread(paste0(path, "data_split/Airpassenger/y_train", k, ".csv")))
  X_test  <- as.matrix(fread(paste0(path, "data_split/Airpassenger/X_test", k, ".csv")))
  y_test  <- as.matrix(fread(paste0(path, "data_split/Airpassenger/y_test", k, ".csv")))

  dtrain <- xgb.DMatrix(data = X_train, label = y_train)

  params <- list(
    objective = "reg:squarederror",  # For regression
    eval_metric = "rmse"
  )
  xgb_model <- xgb.train(
    params = params,
    data = dtrain,
    nrounds = 50
  )

  # Score on the test features. The earlier version built this matrix from
  # X_train, so the predictions did not correspond to y_test.
  dtest <- xgb.DMatrix(data = X_test)
  y_pred <- predict(xgb_model, dtest)

  # Fail loudly instead of silently recycling if the split files disagree.
  stopifnot(length(y_pred) == length(y_test))

  residuals_k <- y_pred - y_test
  rmse <- sqrt(mean(residuals_k^2))
  lst[[k]] <- c(rmse, mad(residuals_k))
}

save(lst, file="C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/results_realdata/Airpassenger_xgboost.RData")


# SNP500 -----
# Ten train/test splits: fit XGBoost on each training split, predict on the
# matching test split, and keep c(RMSE, MAD of the residuals) per split.
snp_dir <- paste0(path, "data_split/SNP500/")

# Booster settings are the same for every split, so build them once.
booster_params <- list(
  objective = "reg:squarederror",
  eval_metric = "rmse"
)

lst <- list()
for (k in seq_len(10)) {
  train_x <- as.matrix(fread(paste0(snp_dir, "X_train", k, ".csv")))
  train_y <- as.matrix(fread(paste0(snp_dir, "y_train", k, ".csv")))
  test_x  <- as.matrix(fread(paste0(snp_dir, "X_test", k, ".csv")))
  test_y  <- as.matrix(fread(paste0(snp_dir, "y_test", k, ".csv")))

  fit <- xgb.train(
    params = booster_params,
    data = xgb.DMatrix(data = train_x, label = train_y),
    nrounds = 50
  )

  # Prediction error on the test split.
  pred <- predict(fit, xgb.DMatrix(data = test_x))
  err <- pred - test_y

  lst[[k]] <- c(sqrt(mean(err^2)), mad(err))
}

save(lst, file="C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/results_realdata/SNP500_xgboost.RData")






# spaRNAseq -----
# Same protocol as the other datasets: 10 splits, XGBoost regression with 50
# boosting rounds, and c(RMSE, MAD of residuals) recorded for each split.

# Read one CSV of the spaRNA_seq split `k` (e.g. stem = "X_train") as a matrix.
read_sparna_split <- function(stem, k) {
  as.matrix(fread(paste0(path, "data_split/spaRNA_seq/", stem, k, ".csv")))
}

lst <- list()
for (k in 1:10) {
  features_train <- read_sparna_split("X_train", k)
  features_test  <- read_sparna_split("X_test", k)
  target_test    <- read_sparna_split("y_test", k)
  target_train   <- read_sparna_split("y_train", k)

  train_dmat <- xgb.DMatrix(data = features_train, label = target_train)
  test_dmat  <- xgb.DMatrix(data = features_test)

  booster <- xgb.train(
    params = list(objective = "reg:squarederror", eval_metric = "rmse"),
    data = train_dmat,
    nrounds = 50
  )

  # Residuals of the test-split predictions.
  delta <- predict(booster, test_dmat) - target_test
  split_rmse <- sqrt(mean(delta^2))
  split_mad <- mad(delta)

  lst[[k]] <- c(split_rmse, split_mad)
}

save(lst, file="C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/results_realdata/spRNA_seq_xgboost.RData")






# TCGA -----
# Evaluate XGBoost on the 10 TCGA splits. Each list element of `lst` is
# c(RMSE, MAD of residuals) for one split, in split order.
lst <- lapply(1:10, function(k) {
  tcga_file <- function(stem) {
    paste0(path, "data_split/TCGA/", stem, k, ".csv")
  }

  x_tr <- as.matrix(fread(tcga_file("X_train")))
  x_te <- as.matrix(fread(tcga_file("X_test")))
  y_te <- as.matrix(fread(tcga_file("y_test")))
  y_tr <- as.matrix(fread(tcga_file("y_train")))

  model <- xgb.train(
    params = list(
      objective = "reg:squarederror",
      eval_metric = "rmse"
    ),
    data = xgb.DMatrix(data = x_tr, label = y_tr),
    nrounds = 50
  )

  # Test-split prediction error.
  gap <- predict(model, xgb.DMatrix(data = x_te)) - y_te

  c(sqrt(mean(gap^2)), mad(gap))
})

save(lst, file="C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/results_realdata/TCGA_xgboost.RData")




# Age clock (GSE40279) -----
# For each of the 10 splits: fit an XGBoost regressor on the training split,
# predict on the matching test split, and store c(RMSE, MAD of residuals).
lst <- list()
for (k in 1:10) {
  X_train <- as.matrix(fread(paste0(path, "data_split/GSE40279/X_train", k, ".csv")))
  X_test  <- as.matrix(fread(paste0(path, "data_split/GSE40279/X_test", k, ".csv")))
  y_test  <- as.matrix(fread(paste0(path, "data_split/GSE40279/y_test", k, ".csv")))
  y_train <- as.matrix(fread(paste0(path, "data_split/GSE40279/y_train", k, ".csv")))

  dtrain <- xgb.DMatrix(data = X_train, label = y_train)

  params <- list(
    objective = "reg:squarederror",  # For regression
    eval_metric = "rmse"
  )
  xgb_model <- xgb.train(
    params = params,
    data = dtrain,
    nrounds = 50
  )
  dtest <- xgb.DMatrix(data = X_test)
  y_pred <- predict(xgb_model, dtest)

  # Fail loudly instead of silently recycling if the split files disagree.
  stopifnot(length(y_pred) == length(y_test))

  residuals_k <- y_pred - y_test
  # Square the residuals before averaging. The earlier version squared the
  # root of the mean error (a misplaced parenthesis), which is not the RMSE
  # and can be NaN when the mean error is negative.
  rmse <- sqrt(mean(residuals_k^2))
  lst[[k]] <- c(rmse, mad(residuals_k))
}

save(lst, file="C:/Document/Serieux/Travail/Data_analysis_and_papers/nash_experiement/results_realdata/GSE40279_xgboost.RData")






