{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "cells": [
    {
      "cell_type": "code",
      "source": [
        "import pandas as pd\n",
        "import numpy as np\n",
        "\n",
        "# Load the three CSV files\n",
        "nrms_df = pd.read_csv('NRMS_sliding.csv')\n",
        "ebnr_df = pd.read_csv('EBNR_sliding.csv')\n",
        "naml_df = pd.read_csv('NAML_sliding.csv')\n",
        "\n",
        "def calculate_full_stats(values, metric_name, model_name):\n",
        "    \"\"\"Calculate comprehensive statistics for all values (including zeros)\"\"\"\n",
        "    stats = {\n",
        "        'model': model_name,\n",
        "        'metric': metric_name,\n",
        "        'count': len(values),\n",
        "        'max': np.max(values),\n",
        "        'min': np.min(values),\n",
        "        'variance': np.var(values),\n",
        "        'std': np.std(values),\n",
        "        'mean': np.mean(values),\n",
        "        'median': np.median(values),\n",
        "        'q1': np.percentile(values, 25),\n",
        "        'q3': np.percentile(values, 75),\n",
        "        'non_zero_count': np.sum(values > 0),\n",
        "        'zero_count': np.sum(values == 0),\n",
        "        'non_zero_percentage': (np.sum(values > 0) / len(values)) * 100\n",
        "    }\n",
        "    return stats\n",
        "\n",
        "# Define metrics to analyze\n",
        "metrics = ['MRR', 'nDCG@5', 'nDCG@10']\n",
        "models_data = [('NRMS', nrms_df), ('EBNR', ebnr_df), ('NAML', naml_df)]\n",
        "\n",
        "# Store all statistics\n",
        "all_stats = []\n",
        "\n",
        "# Calculate statistics for each metric and model\n",
        "for metric in metrics:\n",
        "    print(f\"{metric} STATISTICS (ALL VALUES):\")\n",
        "    print(\"=\" * 60)\n",
        "\n",
        "    metric_stats = []\n",
        "    for model_name, df in models_data:\n",
        "        values = df[metric].values\n",
        "        stats = calculate_full_stats(values, metric, model_name)\n",
        "        metric_stats.append(stats)\n",
        "        all_stats.append(stats)\n",
        "\n",
        "        print(f\"\\n{model_name}:\")\n",
        "        print(f\"  Count: {stats['count']}\")\n",
        "        print(f\"  Max: {stats['max']:.8f}\")\n",
        "        print(f\"  Min: {stats['min']:.8f}\")\n",
        "        print(f\"  Variance: {stats['variance']:.10f}\")\n",
        "        print(f\"  Std Dev: {stats['std']:.8f}\")\n",
        "        print(f\"  Mean: {stats['mean']:.8f}\")\n",
        "        print(f\"  Median: {stats['median']:.8f}\")\n",
        "        print(f\"  Q1 (25th percentile): {stats['q1']:.8f}\")\n",
        "        print(f\"  Q3 (75th percentile): {stats['q3']:.8f}\")\n",
        "        print(f\"  Non-zero values: {stats['non_zero_count']} ({stats['non_zero_percentage']:.3f}%)\")\n",
        "        print(f\"  Zero values: {stats['zero_count']}\")\n",
        "\n",
        "    print(\"\\n\")\n",
        "\n",
        "# Create comprehensive comparison table\n",
        "print(\"\\nCOMPREHENSIVE COMPARISON TABLE:\")\n",
        "print(\"=\" * 120)\n",
        "print(f\"{'Metric':<10} {'Model':<6} {'Max':<12} {'Min':<12} {'Variance':<15} {'Std Dev':<12} {'Mean':<12} {'Non-Zero %':<10}\")\n",
        "print(\"-\" * 120)\n",
        "\n",
        "for stats in all_stats:\n",
        "    print(f\"{stats['metric']:<10} {stats['model']:<6} {stats['max']:<12.8f} \"\n",
        "          f\"{stats['min']:<12.8f} {stats['variance']:<15.10f} {stats['std']:<12.8f} \"\n",
        "          f\"{stats['mean']:<12.8f} {stats['non_zero_percentage']:<10.2f}%\")\n",
        "\n",
        "# Find best performers for each metric\n",
        "print(\"\\n\\nBEST PERFORMERS BY METRIC:\")\n",
        "print(\"=\" * 50)\n",
        "\n",
        "for metric in metrics:\n",
        "    metric_data = [s for s in all_stats if s['metric'] == metric]\n",
        "\n",
        "    # Highest max value\n",
        "    best_max = max(metric_data, key=lambda x: x['max'])\n",
        "    # Highest mean value\n",
        "    best_mean = max(metric_data, key=lambda x: x['mean'])\n",
        "    # Highest variance (most variable)\n",
        "    highest_var = max(metric_data, key=lambda x: x['variance'])\n",
        "    # Lowest variance (most consistent)\n",
        "    lowest_var = min(metric_data, key=lambda x: x['variance'])\n",
        "\n",
        "    print(f\"\\n{metric}:\")\n",
        "    print(f\"  Highest Max: {best_max['model']} ({best_max['max']:.6f})\")\n",
        "    print(f\"  Highest Mean: {best_mean['model']} ({best_mean['mean']:.6f})\")\n",
        "    print(f\"  Highest Variance: {highest_var['model']} ({highest_var['variance']:.8f})\")\n",
        "    print(f\"  Lowest Variance: {lowest_var['model']} ({lowest_var['variance']:.8f})\")\n",
        "\n",
        "# Summary statistics across all metrics\n",
        "print(\"\\n\\nSUMMARY STATISTICS ACROSS ALL METRICS:\")\n",
        "print(\"=\" * 55)\n",
        "\n",
        "for model_name, _ in models_data:\n",
        "    model_stats = [s for s in all_stats if s['model'] == model_name]\n",
        "\n",
        "    total_variance = sum(s['variance'] for s in model_stats)\n",
        "    avg_mean = np.mean([s['mean'] for s in model_stats])\n",
        "    avg_nonzero_pct = np.mean([s['non_zero_percentage'] for s in model_stats])\n",
        "\n",
        "    print(f\"\\n{model_name}:\")\n",
        "    print(f\"  Total Variance (sum): {total_variance:.10f}\")\n",
        "    print(f\"  Average Mean: {avg_mean:.8f}\")\n",
        "    print(f\"  Average Non-zero %: {avg_nonzero_pct:.2f}%\")\n",
        "\n",
        "# Optional: Export all results to CSV\n",
        "\"\"\"\n",
        "import pandas as pd\n",
        "\n",
        "# Convert results to DataFrame\n",
        "results_df = pd.DataFrame(all_stats)\n",
        "\n",
        "# Reorder columns for better readability\n",
        "column_order = ['model', 'metric', 'count', 'max', 'min', 'variance', 'std',\n",
        "                'mean', 'median', 'q1', 'q3', 'non_zero_count', 'zero_count', 'non_zero_percentage']\n",
        "results_df = results_df[column_order]\n",
        "\n",
        "# Save to CSV\n",
        "results_df.to_csv('comprehensive_metrics_statistics.csv', index=False)\n",
        "print('Results saved to comprehensive_metrics_statistics.csv')\n",
        "\n",
        "# Display the DataFrame\n",
        "print(results_df.to_string(index=False))\n",
        "\"\"\"\n"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 1000
        },
        "id": "Z5zuPKeaEK1N",
        "outputId": "15909a98-cb84-4e47-c7fe-9df8f7d3c5ef"
      },
      "execution_count": 3,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "MRR STATISTICS (ALL VALUES):\n",
            "============================================================\n",
            "\n",
            "NRMS:\n",
            "  Count: 20600\n",
            "  Max: 0.50000000\n",
            "  Min: 0.00010048\n",
            "  Variance: 0.0000688083\n",
            "  Std Dev: 0.00829508\n",
            "  Mean: 0.00091166\n",
            "  Median: 0.00020115\n",
            "  Q1 (25th percentile): 0.00013394\n",
            "  Q3 (75th percentile): 0.00039793\n",
            "  Non-zero values: 20600 (100.000%)\n",
            "  Zero values: 0\n",
            "\n",
            "EBNR:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00010048\n",
            "  Variance: 0.0001025064\n",
            "  Std Dev: 0.01012454\n",
            "  Mean: 0.00097509\n",
            "  Median: 0.00019992\n",
            "  Q1 (25th percentile): 0.00013367\n",
            "  Q3 (75th percentile): 0.00040197\n",
            "  Non-zero values: 20600 (100.000%)\n",
            "  Zero values: 0\n",
            "\n",
            "NAML:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00010048\n",
            "  Variance: 0.0002672119\n",
            "  Std Dev: 0.01634662\n",
            "  Mean: 0.00110226\n",
            "  Median: 0.00020024\n",
            "  Q1 (25th percentile): 0.00013378\n",
            "  Q3 (75th percentile): 0.00040036\n",
            "  Non-zero values: 20600 (100.000%)\n",
            "  Zero values: 0\n",
            "\n",
            "\n",
            "nDCG@5 STATISTICS (ALL VALUES):\n",
            "============================================================\n",
            "\n",
            "NRMS:\n",
            "  Count: 20600\n",
            "  Max: 0.63092975\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0001002905\n",
            "  Std Dev: 0.01001451\n",
            "  Mean: 0.00019466\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 8 (0.039%)\n",
            "  Zero values: 20592\n",
            "\n",
            "EBNR:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0001492043\n",
            "  Std Dev: 0.01221492\n",
            "  Mean: 0.00029002\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 13 (0.063%)\n",
            "  Zero values: 20587\n",
            "\n",
            "NAML:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0003102426\n",
            "  Std Dev: 0.01761371\n",
            "  Mean: 0.00042763\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 14 (0.068%)\n",
            "  Zero values: 20586\n",
            "\n",
            "\n",
            "nDCG@10 STATISTICS (ALL VALUES):\n",
            "============================================================\n",
            "\n",
            "NRMS:\n",
            "  Count: 20600\n",
            "  Max: 0.63092975\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0001663216\n",
            "  Std Dev: 0.01289658\n",
            "  Mean: 0.00039843\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 21 (0.102%)\n",
            "  Zero values: 20579\n",
            "\n",
            "EBNR:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0002156523\n",
            "  Std Dev: 0.01468511\n",
            "  Mean: 0.00049450\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 26 (0.126%)\n",
            "  Zero values: 20574\n",
            "\n",
            "NAML:\n",
            "  Count: 20600\n",
            "  Max: 1.00000000\n",
            "  Min: 0.00000000\n",
            "  Variance: 0.0003970592\n",
            "  Std Dev: 0.01992634\n",
            "  Mean: 0.00070290\n",
            "  Median: 0.00000000\n",
            "  Q1 (25th percentile): 0.00000000\n",
            "  Q3 (75th percentile): 0.00000000\n",
            "  Non-zero values: 32 (0.155%)\n",
            "  Zero values: 20568\n",
            "\n",
            "\n",
            "\n",
            "COMPREHENSIVE COMPARISON TABLE:\n",
            "========================================================================================================================\n",
            "Metric     Model  Max          Min          Variance        Std Dev      Mean         Non-Zero %\n",
            "------------------------------------------------------------------------------------------------------------------------\n",
            "MRR        NRMS   0.50000000   0.00010048   0.0000688083    0.00829508   0.00091166   100.00    %\n",
            "MRR        EBNR   1.00000000   0.00010048   0.0001025064    0.01012454   0.00097509   100.00    %\n",
            "MRR        NAML   1.00000000   0.00010048   0.0002672119    0.01634662   0.00110226   100.00    %\n",
            "nDCG@5     NRMS   0.63092975   0.00000000   0.0001002905    0.01001451   0.00019466   0.04      %\n",
            "nDCG@5     EBNR   1.00000000   0.00000000   0.0001492043    0.01221492   0.00029002   0.06      %\n",
            "nDCG@5     NAML   1.00000000   0.00000000   0.0003102426    0.01761371   0.00042763   0.07      %\n",
            "nDCG@10    NRMS   0.63092975   0.00000000   0.0001663216    0.01289658   0.00039843   0.10      %\n",
            "nDCG@10    EBNR   1.00000000   0.00000000   0.0002156523    0.01468511   0.00049450   0.13      %\n",
            "nDCG@10    NAML   1.00000000   0.00000000   0.0003970592    0.01992634   0.00070290   0.16      %\n",
            "\n",
            "\n",
            "BEST PERFORMERS BY METRIC:\n",
            "==================================================\n",
            "\n",
            "MRR:\n",
            "  Highest Max: EBNR (1.000000)\n",
            "  Highest Mean: NAML (0.001102)\n",
            "  Highest Variance: NAML (0.00026721)\n",
            "  Lowest Variance: NRMS (0.00006881)\n",
            "\n",
            "nDCG@5:\n",
            "  Highest Max: EBNR (1.000000)\n",
            "  Highest Mean: NAML (0.000428)\n",
            "  Highest Variance: NAML (0.00031024)\n",
            "  Lowest Variance: NRMS (0.00010029)\n",
            "\n",
            "nDCG@10:\n",
            "  Highest Max: EBNR (1.000000)\n",
            "  Highest Mean: NAML (0.000703)\n",
            "  Highest Variance: NAML (0.00039706)\n",
            "  Lowest Variance: NRMS (0.00016632)\n",
            "\n",
            "\n",
            "SUMMARY STATISTICS ACROSS ALL METRICS:\n",
            "=======================================================\n",
            "\n",
            "NRMS:\n",
            "  Total Variance (sum): 0.0003354205\n",
            "  Average Mean: 0.00050159\n",
            "  Average Non-zero %: 33.38%\n",
            "\n",
            "EBNR:\n",
            "  Total Variance (sum): 0.0004673631\n",
            "  Average Mean: 0.00058654\n",
            "  Average Non-zero %: 33.40%\n",
            "\n",
            "NAML:\n",
            "  Total Variance (sum): 0.0009745138\n",
            "  Average Mean: 0.00074426\n",
            "  Average Non-zero %: 33.41%\n"
          ]
        },
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "\"\\nimport pandas as pd\\n\\n# Convert results to DataFrame\\nresults_df = pd.DataFrame(all_stats)\\n\\n# Reorder columns for better readability\\ncolumn_order = ['model', 'metric', 'count', 'max', 'min', 'variance', 'std', \\n                'mean', 'median', 'q1', 'q3', 'non_zero_count', 'zero_count', 'non_zero_percentage']\\nresults_df = results_df[column_order]\\n\\n# Save to CSV\\nresults_df.to_csv('comprehensive_metrics_statistics.csv', index=False)\\nprint('Results saved to comprehensive_metrics_statistics.csv')\\n\\n# Display the DataFrame\\nprint(results_df.to_string(index=False))\\n\""
            ],
            "application/vnd.google.colaboratory.intrinsic+json": {
              "type": "string"
            }
          },
          "metadata": {},
          "execution_count": 3
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [],
      "metadata": {
        "id": "vO-u5NzwL9UC"
      },
      "execution_count": null,
      "outputs": []
    }
  ]
}