clear all;
clc;
num_vertices_range = 10:300:2300;
p_fixed = 0.2;
q_fixed = 0.165;
num_iterations = 1;
rng(45);
time_spectral = zeros(num_iterations, length(num_vertices_range));
time_corr = zeros(num_iterations, length(num_vertices_range));
time_corr_selfloop = zeros(num_iterations, length(num_vertices_range));

for idx = 1:length(num_vertices_range)
    n = num_vertices_range(idx);
    group_labels = repelem([1, 2], n/2);
    time_spectral_iter = zeros(1, num_iterations);
    time_corr_iter = zeros(1, num_iterations);
    time_corr_selfloop_iter = zeros(1, num_iterations);

    for iter = 1:num_iterations
        [s_G, t_G, weights_G, ~] = stochastic_block_model(n, p_fixed, q_fixed, group_labels);
        G = graph(s_G, t_G, weights_G, n);
        [s_H, t_H, weights_H, ~] = stochastic_block_model(n, q_fixed, p_fixed, group_labels);
        H = graph(s_H, t_H, weights_H, n);

        tic;
        [clusters_spectral, ~, ~] = spectral_clustering(s_G, t_G, weights_G);
        time_spectral_iter(iter) = toc;

        L_G = compute_normalized_laplacian(s_G, t_G, weights_G, n);
        L_H = compute_normalized_laplacian(s_H, t_H, weights_H, n);
        tic;
        [~, ~, ~, ~, ~] = generalized_eigenvalue_spectrum_with_quadratic_forms(L_G, L_H);
        time_corr_iter(iter) = toc;

        s_H_selfloop = [s_H; 1];
        t_H_selfloop = [t_H; 1];
        weights_H_selfloop = [weights_H; 0.1];
        L_H_selfloop = compute_normalized_laplacian(s_H_selfloop, t_H_selfloop, weights_H_selfloop, n);
        tic;
        [~, ~, ~, ~, ~] = generalized_eigenvalue_spectrum_with_quadratic_forms(L_G, L_H_selfloop, true);
        time_corr_selfloop_iter(iter) = toc;
    end
    
    time_spectral(:, idx) = mean(time_spectral_iter);
    time_corr(:, idx) = mean(time_corr_iter);
    time_corr_selfloop(:, idx) = mean(time_corr_selfloop_iter);
end

fprintf('Vertices\t Spectral Clustering\t Correlation Clustering\t Correlation Clustering with Self-loops\n');
for i = 1:length(num_vertices_range)
    fprintf('%d\t\t %.4f seconds\t\t\t %.4f seconds\t\t\t %.4f seconds\n', ...
        num_vertices_range(i), time_spectral(i), time_corr(i), time_corr_selfloop(i));
end

figure;
plot(num_vertices_range, time_corr, '-s', 'LineWidth', 2, 'Color', [0.8500 0.3250 0.0980], 'DisplayName', 'CC');
hold on;
plot(num_vertices_range, time_corr_selfloop, '-d', 'LineWidth', 2, 'Color', [0 0.4470 0.7410], 'DisplayName', 'CC++');
hold on;
plot(num_vertices_range, time_spectral, '-o', 'LineWidth', 2, 'DisplayName', 'SC');
hold on;
xlabel('Number of Vertices', 'FontSize', 14, 'FontWeight', 'bold');
ylabel('Mean Execution Time (seconds)', 'FontSize', 14, 'FontWeight', 'bold');
title('Mean Execution Time vs Number of Vertices', 'FontSize', 16, 'FontWeight', 'bold');
legend('Location', 'Best', 'FontSize', 12);
grid on;
ax = gca;
ax.GridLineStyle = '--';
ax.GridAlpha = 0.7;
ax.FontSize = 12;
ax.LineWidth = 1.5;
box on;
xlim([10, 2110])







function [sorted_eigenvalues, sorted_eigenvectors, quadratic_forms, selected_eigenvector, cluster_labels] = generalized_eigenvalue_spectrum_with_quadratic_forms(L_G, L_H, try_cholesky)
    if nargin < 3 || isempty(try_cholesky)
        try_cholesky = false;
    end
    threshold = 1e-6;
    if try_cholesky
        try
            [eigenvectors, eigenvalues] = eig(L_G, L_H,"chol");
        catch
            [eigenvectors, eigenvalues] = eig(L_G, L_H,"qz");
        end
    else
        [eigenvectors, eigenvalues] = eig(L_G, L_H,"qz");
    end
    eigenvalues_diag = diag(eigenvalues);
    [sorted_eigenvalues, idx] = sort(eigenvalues_diag, 'ascend');
    sorted_eigenvectors = eigenvectors(:, idx);
    valid_indices = ~isinf(sorted_eigenvalues) & ~isnan(sorted_eigenvalues);
    sorted_eigenvalues = sorted_eigenvalues(valid_indices);
    sorted_eigenvectors = sorted_eigenvectors(:, valid_indices);
    quadratic_forms = zeros(length(sorted_eigenvalues), 1);
    for i = 1:length(sorted_eigenvalues)
        x = sorted_eigenvectors(:, i);
        numerator = x' * L_G * x;
        denominator = x' * L_H * x;
        if denominator ~= 0
            quadratic_forms(i) = numerator / denominator;
        else
            quadratic_forms(i) = NaN;
        end
    end
    if length(sorted_eigenvalues) >= 2 && sorted_eigenvalues(2) > threshold
        selected_eigenvector = sorted_eigenvectors(:, 2);
    else
        idx_above_threshold = find(sorted_eigenvalues > threshold, 1, 'first');
        if isempty(idx_above_threshold)
            error('No eigenvalues found above the specified threshold.');
        end
        selected_eigenvector = sorted_eigenvectors(:, idx_above_threshold);
    end
    selected_eigenvector = real(selected_eigenvector);
    cluster_labels = kmeans(selected_eigenvector, 2);
end
