import numpy as np
import torch
import torch.nn as nn
import torch.optim as optim
from sklearn.metrics import accuracy_score
import pandas as pd
from torch.utils.data import DataLoader, TensorDataset
from torch.optim.lr_scheduler import ReduceLROnPlateau

# Load data
train_data = np.load("./input/train_data.npy")
train_label = np.load("./input/train_label.npy")
val_data = np.load("./input/val_data.npy")
val_label = np.load("./input/val_label.npy")

# Normalize data
mean = train_data.mean(axis=0)
std = train_data.std(axis=0)

train_data_normalized = (train_data - mean) / std
val_data_normalized = (val_data - mean) / std


# Add Gaussian noise for data augmentation
def add_gaussian_noise(data, noise_factor=0.1):
    noise = np.random.normal(loc=0.0, scale=noise_factor, size=data.shape)
    return data + noise


train_data_augmented = add_gaussian_noise(train_data_normalized)

# Reshape data if necessary
X_train = torch.FloatTensor(
    train_data_augmented.reshape(train_data_augmented.shape[0], -1)
)
y_train = torch.LongTensor(train_label)
X_val = torch.FloatTensor(val_data_normalized.reshape(val_data_normalized.shape[0], -1))
y_val = torch.LongTensor(val_label)


# Define the neural network model with Batch Normalization and Dropout
class ImprovedNN(nn.Module):
    def __init__(self):
        super(ImprovedNN, self).__init__()
        self.fc1 = nn.Linear(X_train.shape[1], 256)
        self.bn1 = nn.BatchNorm1d(256)
        self.dropout1 = nn.Dropout(0.5)  # Dropout layer
        self.fc2 = nn.Linear(256, 128)
        self.bn2 = nn.BatchNorm1d(128)
        self.dropout2 = nn.Dropout(0.5)  # Dropout layer
        self.fc3 = nn.Linear(128, 64)
        self.bn3 = nn.BatchNorm1d(64)
        self.fc4 = nn.Linear(64, 18)  # 18 classes

    def forward(self, x):
        x = torch.relu(self.bn1(self.fc1(x)))
        x = self.dropout1(x)  # Apply dropout
        x = torch.relu(self.bn2(self.fc2(x)))
        x = self.dropout2(x)  # Apply dropout
        x = torch.relu(self.bn3(self.fc3(x)))
        x = self.fc4(x)
        return x


# Create DataLoader
train_dataset = TensorDataset(X_train, y_train)
train_loader = DataLoader(train_dataset, batch_size=64, shuffle=True)

# Initialize model, loss function, optimizer and scheduler
model = ImprovedNN()
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)
scheduler = ReduceLROnPlateau(optimizer, "min", patience=5, verbose=True)

# Training the model with increased epochs and early stopping
num_epochs = 50  # Increased number of epochs
best_val_loss = float("inf")
patience = 10
patience_counter = 0

for epoch in range(num_epochs):
    model.train()
    for inputs, labels in train_loader:
        optimizer.zero_grad()
        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

    # Evaluating the model
    model.eval()
    with torch.no_grad():
        val_outputs = model(X_val)
        val_loss = criterion(val_outputs, y_val)
        _, predicted = torch.max(val_outputs, 1)
        accuracy = accuracy_score(y_val.numpy(), predicted.numpy())

    # Adjust learning rate
    scheduler.step(val_loss)

    print(
        f"Epoch {epoch + 1}/{num_epochs}, Validation Loss: {val_loss.item():.4f}, Validation Accuracy: {accuracy:.4f}"
    )

    # Early stopping
    if val_loss < best_val_loss:
        best_val_loss = val_loss
        patience_counter = 0
    else:
        patience_counter += 1
        if patience_counter >= patience:
            print("Early stopping triggered.")
            break

# Save predictions to submission file
submission = pd.DataFrame({"Id": np.arange(len(predicted)), "Label": predicted.numpy()})
submission.to_csv("./working/submission.csv", index=False)

# Print the final evaluation metric
print(f"Final Validation Accuracy: {accuracy:.4f}")
