from sklearn.model_selection import train_test_split
from sklearn.svm import SVC
import numpy as np
# from Deep_ICE_array_complement import Deep_ICE
from sklearn.svm import SVC
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from sklearn.preprocessing import StandardScaler
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.linear_model import LogisticRegression
from E01_ICE import E01_ICE
from auxfuncs_array import pred_linear
from ICE_coreset import coreset_while
import torch


data = np.loadtxt("datasets/spesis_975_3D.csv", delimiter=",")

data = np.unique(data, axis=0)

X = data[:,:-1]
y = data[:,-1]
N,D = X .shape

X = np.unique(X, axis=0)
y[y==0] = -1
y = y.astype(int)


# normalize and add noise to the dataset
min_val = X.min(axis=0)   # Minimum value of each column
max_val = X.max(axis=0)   # Maximum value of each column
epsilon = 1e-8
X = 2 * (X - min_val) / (max_val - min_val+epsilon) - 1

np.random.seed(2024)
noise_std_dev = 1e-8 # Suitable noise standard deviation
noise = np.random.normal(0, noise_std_dev, size=X.shape)
X = X + noise


X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2)
N_train = X_train.shape[0]
N_test = X_test.shape[0]
print(f'The number of training samples is {N_train}, the number of test samples is {N_test}')


#### SVM
svm = SVC(kernel='linear', C=1.0)  # C is the regularization parameter
svm.fit(X_train, y_train)

y_pred_train = svm.predict(X_train)
train_acc_svm = accuracy_score(y_pred_train, y_train)
y_pred_test = svm.predict(X_test)
test_acc_svm = accuracy_score(y_pred_test, y_test)
print(f"SVM: Train Accuracy: {train_acc_svm:.4f}, Test Accuracy: {test_acc_svm:.4f}")

#### logstic regression

log_reg = LogisticRegression(multi_class='ovr', random_state=42)
log_reg.fit(X_train, y_train)
y_pred_train = log_reg.predict(X_train)
train_acc_log_reg = accuracy_score(y_pred_train, y_train)


y_pred_test = log_reg.predict(X_test)
test_acc_log_reg = accuracy_score(y_pred_test, y_test)
print(f"Logistic-regression: Train Accuracy: {train_acc_log_reg:.4f}, Test Accuracy: {test_acc_log_reg:.4f}")



####  LDA results
lda = LinearDiscriminantAnalysis()
lda.fit(X_train, y_train)
y_pred_train = lda.predict(X_train)
train_acc_lda = accuracy_score(y_pred_train, y_train)


y_pred_test = lda.predict(X_test)
test_acc_lda = accuracy_score(y_pred_test, y_test)
print(f"LDA: Train Accuracy: {train_acc_lda:.4f}, Test Accuracy: {test_acc_lda:.4f}")

#### Exact_ICE

inds = [i for i in range(N_train)]
res = E01_ICE(inds, X_train, y_train, 1,  int(5e3), 'cuda', verbose=False)

w = res[0]

train_loss = res[1].item()
train_acc_ice = 1 - train_loss/N_train


y_pred_test = pred_linear(X_test, w)
y_test = torch.tensor(y_test)
loss_test = torch.sum(y_pred_test!=y_test)
if loss_test > y_test.shape[0]/2:
    loss_test = torch.sum((-y_pred_test)!=y_test)
test_acc_ice = 1 - loss_test/N_test

print(f"ICE: Train Accuracy: {train_acc_ice:.4f}, Test Accuracy: {test_acc_ice:.4f}")

