import numpy as np
import anndata
import os
from sklearn.manifold import TSNE

# Load the data
adata = anndata.read_h5ad(os.path.join("./input", "5k_pbmc_processed.h5ad"))

# Apply t-SNE for dimensionality reduction with random initialization
tsne = TSNE(n_components=2, random_state=42, init="random")
adata.obsm["X_emb"] = tsne.fit_transform(adata.X)


# Evaluation functions
def _distance_correlation(X, X_emb):
    import scipy.spatial
    import scipy.stats

    high_dimensional_distance_vector = scipy.spatial.distance.pdist(X)
    low_dimensional_distance_vector = scipy.spatial.distance.pdist(X_emb)
    return scipy.stats.spearmanr(
        low_dimensional_distance_vector, high_dimensional_distance_vector
    )[0]


def distance_correlation(adata, n_svd=500):
    import sklearn.decomposition

    X = adata.X
    if n_svd < min(X.shape):
        X = sklearn.decomposition.TruncatedSVD(n_svd).fit_transform(X)
    else:
        X = X.toarray()
    return _distance_correlation(X, adata.obsm["X_emb"])


def trustworthiness(adata):
    from sklearn import manifold

    high_dim, low_dim = adata.X, adata.obsm["X_emb"]
    score = manifold.trustworthiness(
        high_dim, low_dim, n_neighbors=15, metric="euclidean"
    )
    return float(np.clip(score, 0, 1))


def evaluate(adata):
    tw = trustworthiness(adata)
    dc = distance_correlation(adata)
    val_metric = (tw + dc) / 2
    return val_metric


# Compute evaluation metric
evaluation_metric = evaluate(adata)
print("Evaluation Metric:", evaluation_metric)

# Save the results
submission_path = os.path.join("./working", "submission.csv")
np.savetxt(submission_path, adata.obsm["X_emb"], delimiter=",")
