{
  "cells": [
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 1000
        },
        "id": "1I5-qRamGGz0",
        "outputId": "182d14cb-624b-493f-c889-ef8459e87231"
      },
      "outputs": [],
      "source": [
        "\"\"\"\n",
        "Self-contained script to reproduce the dimension comparison experiment.\n",
        "This script includes all necessary imports, class definitions, and experiment code.\n",
        "\"\"\"\n",
        "\n",
        "import numpy as np\n",
        "import matplotlib.pyplot as plt\n",
        "import seaborn as sns\n",
        "import pandas as pd\n",
        "import sys\n",
        "import os\n",
        "from scipy.special import zeta\n",
        "\n",
        "# Set random seed for reproducibility\n",
        "np.random.seed(42)\n",
        "\n",
        "# Font size parameters for easy tuning\n",
        "TITLE_FONTSIZE = 22\n",
        "SUBTITLE_FONTSIZE = 22\n",
        "AXIS_LABEL_FONTSIZE = 18\n",
        "TICK_LABEL_FONTSIZE = 18\n",
        "LEGEND_FONTSIZE = 18\n",
        "ANNOTATION_FONTSIZE = 18\n",
        "\n",
        "# Constants\n",
        "MAX_K = 100\n",
        "\n",
        "def muu(k, alpha=0.99):\n",
        "    return alpha ** k + 1e-10\n",
        "\n",
        "# Base estimator class\n",
        "class GradEstimator:\n",
        "    \"\"\"Base class for gradient estimators.\"\"\"\n",
        "\n",
        "    def __init__(self, zoo_batch_size=16, mu=1e-6):\n",
        "        \"\"\"Initialize a gradient estimator.\n",
        "\n",
        "        Args:\n",
        "            zoo_batch_size (int, optional): The batch size for gradient estimation. Defaults to 16.\n",
        "            mu (float, optional): The perturbation size. Defaults to 1e-6.\n",
        "        \"\"\"\n",
        "        self.zoo_batch_size = zoo_batch_size\n",
        "        self.mu = mu\n",
        "        self._cost = 1  # Default cost is 1 function evaluation per gradient estimation\n",
        "\n",
        "    def generate_noise(self, x):\n",
        "        \"\"\"Generate noise for gradient estimation.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to estimate the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The noise vector.\n",
        "        \"\"\"\n",
        "        raise NotImplementedError(\"Subclasses must implement generate_noise\")\n",
        "\n",
        "    def estimate(self, f, x):\n",
        "        \"\"\"Estimate the gradient of a function at a point.\n",
        "\n",
        "        Args:\n",
        "            f (callable): The function to estimate the gradient for.\n",
        "            x (numpy.ndarray): The point at which to estimate the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The estimated gradient.\n",
        "        \"\"\"\n",
        "        raise NotImplementedError(\"Subclasses must implement estimate\")\n",
        "\n",
        "# Unbiased estimator implementation\n",
        "class UnbiasedEstimator(GradEstimator):\n",
        "    \"\"\"Unbiased estimator implementation.\n",
        "\n",
        "    This estimator uses a special technique to achieve unbiased gradient estimation.\n",
        "\n",
        "    Attributes:\n",
        "        zoo_batch_size (int): The batch size for gradient estimation.\n",
        "        mu (float): The perturbation size.\n",
        "        a (float): The parameter for the Zipf distribution.\n",
        "        P (int): The number of function evaluations per gradient estimation.\n",
        "        alpha (float): The parameter for the perturbation size.\n",
        "    \"\"\"\n",
        "\n",
        "    def __init__(self, P=4, zoo_batch_size=16, mu=1e-6, a=2.0, alpha=0.99):\n",
        "        \"\"\"Initialize an unbiased estimator.\n",
        "\n",
        "        Args:\n",
        "            P (int, optional): The number of function evaluations per gradient estimation. Defaults to 4.\n",
        "            zoo_batch_size (int, optional): The batch size for gradient estimation. Defaults to 16.\n",
        "            mu (float, optional): The perturbation size. Defaults to 1e-6.\n",
        "            a (float, optional): The parameter for the Zipf distribution. Defaults to 2.0.\n",
        "            alpha (float, optional): The parameter for the perturbation size. Defaults to 0.99.\n",
        "        \"\"\"\n",
        "        super().__init__(zoo_batch_size, mu)\n",
        "        self.a = a\n",
        "        assert P in [1,2,3,4], \"P must be 1, 2, 3, or 4\"\n",
        "        self.P = P\n",
        "        self._cost = P # cost is the number of function evaluations per gradient estimation\n",
        "        self.alpha = alpha\n",
        "\n",
        "    def generate_noise(self, x):\n",
        "        \"\"\"Generate uniform noise on the unit sphere.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to estimate the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The noise vector.\n",
        "        \"\"\"\n",
        "        ndim = len(x)\n",
        "        vec = np.random.randn(ndim)\n",
        "        vec /= np.linalg.norm(vec)\n",
        "        return vec * np.sqrt(ndim)\n",
        "\n",
        "    def P4_estimator(self, f, x):\n",
        "        grad = np.zeros_like(x)\n",
        "        delta = self.mu\n",
        "        _a = self.a\n",
        "\n",
        "        for i in range(self.zoo_batch_size):\n",
        "            v = self.generate_noise(x)\n",
        "\n",
        "            k = np.random.zipf(a=_a)\n",
        "            k = min(k, MAX_K)\n",
        "\n",
        "            # calculate a_1\n",
        "            noisy_x = x + delta * v\n",
        "            diff = f(noisy_x) - f(x)\n",
        "            a_1 = diff / delta / zeta(_a)\n",
        "            grad += a_1 * v\n",
        "\n",
        "            # calculate a_k\n",
        "            noisy_x = x + delta * v * muu(k-1)\n",
        "            diff_k = f(noisy_x) - f(x)\n",
        "            a_k = diff_k / delta / muu(k-1)\n",
        "\n",
        "            noisy_x = x + delta * v * muu(k)\n",
        "            diff_kk = f(noisy_x) - f(x)\n",
        "            a_kk = diff_kk / delta / muu(k)\n",
        "\n",
        "            # calculate derivative\n",
        "            p_k = k**-_a/zeta(_a)\n",
        "            dd = (a_kk - a_k) / p_k\n",
        "            grad += dd * v\n",
        "        return grad / self.zoo_batch_size\n",
        "\n",
        "    def P3_estimator(self, f, x):\n",
        "        grad = np.zeros_like(x)\n",
        "        delta = self.mu\n",
        "        _a = self.a\n",
        "\n",
        "        for i in range(self.zoo_batch_size):\n",
        "            v = self.generate_noise(x)\n",
        "            selection_variable = np.random.binomial(n=1, p=0.5)\n",
        "\n",
        "            k = np.random.zipf(a=_a)\n",
        "            k = min(k, MAX_K)\n",
        "\n",
        "            # calculate a_1\n",
        "            noisy_x = x + delta * v\n",
        "            diff = f(noisy_x) - f(x)\n",
        "            a_1 = diff / delta / zeta(_a)\n",
        "            grad += a_1 * v * selection_variable\n",
        "\n",
        "            # calculate a_k\n",
        "            noisy_x = x + delta * v * muu(k-1)\n",
        "            diff_k = f(noisy_x) - f(x)\n",
        "            a_k = diff_k / delta / muu(k-1)\n",
        "\n",
        "            noisy_x = x + delta * v * muu(k)\n",
        "            diff_kk = f(noisy_x) - f(x)\n",
        "            a_kk = diff_kk / delta / muu(k)\n",
        "\n",
        "            # calculate derivative\n",
        "            p_k = k**-_a/zeta(_a)\n",
        "            dd = (a_kk - a_k) / p_k\n",
        "            grad += dd * v * (1 - selection_variable)\n",
        "        return grad / self.zoo_batch_size\n",
        "\n",
        "    def P2_estimator(self, f, x):\n",
        "        # Not implemented in this example\n",
        "        raise NotImplementedError(\"P2_estimator not implemented\")\n",
        "\n",
        "    def P1_estimator(self, f, x):\n",
        "        # Not implemented in this example\n",
        "        raise NotImplementedError(\"P1_estimator not implemented\")\n",
        "\n",
        "    def estimate(self, f, x):\n",
        "        if self.P == 4:\n",
        "            return self.P4_estimator(f, x)\n",
        "        elif self.P == 3:\n",
        "            return self.P3_estimator(f, x)\n",
        "        elif self.P == 2:\n",
        "            return self.P2_estimator(f, x)\n",
        "        elif self.P == 1:\n",
        "            return self.P1_estimator(f, x)\n",
        "        else:\n",
        "            raise ValueError(\"P must be 1, 2, 3, or 4\")\n",
        "\n",
        "# Uniform estimator implementation\n",
        "class UniformEstimator(GradEstimator):\n",
        "    \"\"\"Uniform estimator implementation.\n",
        "\n",
        "    This estimator uses uniformly distributed noise on the unit sphere.\n",
        "    \"\"\"\n",
        "\n",
        "    def generate_noise(self, x):\n",
        "        \"\"\"Generate uniform noise on the unit sphere.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to estimate the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The noise vector.\n",
        "        \"\"\"\n",
        "        ndim = len(x)\n",
        "        vec = np.random.randn(ndim)\n",
        "        vec /= np.linalg.norm(vec)\n",
        "        return vec * np.sqrt(ndim)\n",
        "\n",
        "    def estimate(self, f, x):\n",
        "        grad = np.zeros_like(x)\n",
        "\n",
        "        for i in range(self.zoo_batch_size):\n",
        "            v = self.generate_noise(x)\n",
        "            noisy_x = x + self.mu * v\n",
        "            diff = f(noisy_x) - f(x)\n",
        "            grad += diff * v\n",
        "\n",
        "        return grad / (self.mu * self.zoo_batch_size)\n",
        "\n",
        "# Centralized Uniform estimator implementation\n",
        "class CentralizedUniformEstimator(UniformEstimator):\n",
        "    def estimate(self, f, x):\n",
        "        grad = np.zeros_like(x)\n",
        "\n",
        "        for i in range(self.zoo_batch_size):\n",
        "            v = self.generate_noise(x)\n",
        "            noisy_x = x + self.mu * v\n",
        "            noisy_xx = x - self.mu * v\n",
        "            diff = f(noisy_x) - f(noisy_xx)\n",
        "            grad += diff * v\n",
        "\n",
        "        return grad / (2 * self.mu * self.zoo_batch_size)\n",
        "\n",
        "# Gaussian estimator implementation\n",
        "class GaussianEstimator(GradEstimator):\n",
        "    \"\"\"Gaussian estimator implementation.\n",
        "\n",
        "    This estimator uses Gaussian noise for gradient estimation.\n",
        "    \"\"\"\n",
        "\n",
        "    def generate_noise(self, x):\n",
        "        \"\"\"Generate Gaussian noise.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to estimate the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The noise vector.\n",
        "        \"\"\"\n",
        "        return np.random.randn(len(x))\n",
        "\n",
        "    def estimate(self, f, x):\n",
        "        grad = np.zeros_like(x)\n",
        "\n",
        "        for i in range(self.zoo_batch_size):\n",
        "            v = self.generate_noise(x)\n",
        "            noisy_x = x + self.mu * v\n",
        "            diff = f(noisy_x) - f(x)\n",
        "            grad += diff * v\n",
        "\n",
        "        return grad / (self.mu * self.zoo_batch_size)\n",
        "\n",
        "# Function implementations\n",
        "class QuadraticFunction:\n",
        "    \"\"\"Quadratic function implementation.\"\"\"\n",
        "\n",
        "    def __init__(self, n):\n",
        "        \"\"\"Initialize a quadratic function.\n",
        "\n",
        "        Args:\n",
        "            n (int): The dimension of the function.\n",
        "        \"\"\"\n",
        "        self.n = n\n",
        "        self.A = np.eye(n)  # Identity matrix for simplicity\n",
        "\n",
        "    def __call__(self, x):\n",
        "        \"\"\"Evaluate the function at a point.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to evaluate the function.\n",
        "\n",
        "        Returns:\n",
        "            float: The function value.\n",
        "        \"\"\"\n",
        "        return 0.5 * x.T @ self.A @ x\n",
        "\n",
        "    def grad(self, x):\n",
        "        \"\"\"Compute the true gradient at a point.\n",
        "\n",
        "        Args:\n",
        "            x (numpy.ndarray): The point at which to compute the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The true gradient.\n",
        "        \"\"\"\n",
        "        return self.A @ x\n",
        "\n",
        "class LogisticLossFunction:\n",
        "    \"\"\"Logistic loss function implementation.\"\"\"\n",
        "\n",
        "    def __init__(self, input_dim, n_samples=100, random_state=42):\n",
        "        \"\"\"Initialize a logistic loss function.\n",
        "\n",
        "        Args:\n",
        "            input_dim (int): The dimension of the input.\n",
        "            n_samples (int, optional): The number of samples. Defaults to 100.\n",
        "            random_state (int, optional): The random seed. Defaults to 42.\n",
        "        \"\"\"\n",
        "        self.input_dim = input_dim\n",
        "        self.n_samples = n_samples\n",
        "\n",
        "        # Generate random data\n",
        "        np.random.seed(random_state)\n",
        "        self.X = np.random.randn(n_samples, input_dim)\n",
        "        self.y = np.random.binomial(n=1, p=0.5, size=n_samples)\n",
        "\n",
        "    def __call__(self, w):\n",
        "        \"\"\"Evaluate the function at a point.\n",
        "\n",
        "        Args:\n",
        "            w (numpy.ndarray): The point at which to evaluate the function.\n",
        "\n",
        "        Returns:\n",
        "            float: The function value.\n",
        "        \"\"\"\n",
        "        z = self.X @ w\n",
        "        return np.mean(np.log(1 + np.exp(-self.y * z)))\n",
        "\n",
        "    def grad(self, w):\n",
        "        \"\"\"Compute the true gradient at a point.\n",
        "\n",
        "        Args:\n",
        "            w (numpy.ndarray): The point at which to compute the gradient.\n",
        "\n",
        "        Returns:\n",
        "            numpy.ndarray: The true gradient.\n",
        "        \"\"\"\n",
        "        z = self.X @ w\n",
        "        p = 1 / (1 + np.exp(-z))\n",
        "        return -self.X.T @ (self.y - p) / self.n_samples\n",
        "\n",
        "# Helper function to create estimators\n",
        "def create_estimator(name, zoo_batch_size=16, mu=1e-6):\n",
        "    \"\"\"Create an estimator by name.\n",
        "\n",
        "    Args:\n",
        "        name (str): The name of the estimator to create.\n",
        "        zoo_batch_size (int, optional): The batch size for gradient estimation. Defaults to 16.\n",
        "        mu (float, optional): The perturbation size. Defaults to 1e-6.\n",
        "\n",
        "    Returns:\n",
        "        GradEstimator: The created estimator.\n",
        "    \"\"\"\n",
        "    if name == \"gaussian\":\n",
        "        return GaussianEstimator(zoo_batch_size=zoo_batch_size, mu=mu)\n",
        "    elif name == \"uniform\":\n",
        "        return UniformEstimator(zoo_batch_size=zoo_batch_size, mu=mu)\n",
        "    elif name == \"bernoulli\":\n",
        "        # Not used in this example\n",
        "        return UniformEstimator(zoo_batch_size=zoo_batch_size, mu=mu)\n",
        "    else:\n",
        "        raise ValueError(f\"Unknown estimator: {name}\")\n",
        "\n",
        "def compare_multiple_estimators(custom_estimator, reference_names, function, x, batch_size=64, num_trials=10):\n",
        "    \"\"\"Compare a custom estimator against multiple reference estimators.\n",
        "\n",
        "    Args:\n",
        "        custom_estimator: The custom estimator to test\n",
        "        reference_names: List of names of reference estimators to compare with\n",
        "        function: The function to estimate gradients for\n",
        "        x: The point at which to estimate gradients\n",
        "        batch_size: Batch size for all estimators\n",
        "        num_trials: Number of trials to run\n",
        "\n",
        "    Returns:\n",
        "        dict: Dictionary mapping estimator names to their error lists\n",
        "    \"\"\"\n",
        "    # Set batch size\n",
        "    custom_estimator.zoo_batch_size = batch_size\n",
        "\n",
        "    # Create reference estimators\n",
        "    reference_estimators = {}\n",
        "    for name in reference_names:\n",
        "        if name == \"unbiased_p3\":\n",
        "            reference_estimators[name] = UnbiasedEstimator(P=3, zoo_batch_size=1, mu=custom_estimator.mu, a=2.0)\n",
        "        elif name == \"unbiased_p4\":\n",
        "            reference_estimators[name] = UnbiasedEstimator(P=4, zoo_batch_size=1, mu=custom_estimator.mu, a=2.0)\n",
        "        elif name == \"centralized_uniform\":\n",
        "            reference_estimators[name] = CentralizedUniformEstimator(zoo_batch_size=batch_size, mu=custom_estimator.mu)\n",
        "        else:\n",
        "            reference_estimators[name] = create_estimator(name, zoo_batch_size=batch_size, mu=custom_estimator.mu)\n",
        "\n",
        "    # Get true gradient\n",
        "    true_grad = function.grad(x)\n",
        "\n",
        "    # Store all errors\n",
        "    all_errors = {}\n",
        "    for name in reference_names:\n",
        "        all_errors[name.capitalize()] = []\n",
        "\n",
        "    # Run trials\n",
        "    for i in range(num_trials):\n",
        "        # Estimate with reference estimators\n",
        "        for name, estimator in reference_estimators.items():\n",
        "            reference_grad = estimator.estimate(function, x)\n",
        "            reference_error = np.linalg.norm(reference_grad - true_grad)\n",
        "            all_errors[name.capitalize()].append(reference_error)\n",
        "\n",
        "    # Print summary\n",
        "    print(\"\\nSummary:\")\n",
        "    for name in reference_names:\n",
        "        print(f\"{name.capitalize()} estimator - Mean error: {np.mean(all_errors[name.capitalize()]):.6f}, Std: {np.std(all_errors[name.capitalize()]):.6f}\")\n",
        "\n",
        "    return all_errors\n",
        "\n",
        "def run_experiment(function_type, dimensions, zoo_batch_size, num_trials, reference_names):\n",
        "    \"\"\"Run experiment for a specific function type across multiple dimensions.\n",
        "\n",
        "    Args:\n",
        "        function_type (str): Type of function to test ('quadratic' or 'logistic')\n",
        "        dimensions (list): List of dimensions to test\n",
        "        zoo_batch_size (int): Batch size for estimators\n",
        "        num_trials (int): Number of trials per dimension\n",
        "        reference_names (list): List of reference estimator names\n",
        "\n",
        "    Returns:\n",
        "        pd.DataFrame: DataFrame with experiment results\n",
        "    \"\"\"\n",
        "    # Create a DataFrame to store all results\n",
        "    all_results = []\n",
        "\n",
        "    for n in dimensions:\n",
        "        print(f\"\\n\\n===== Testing {function_type} function with dimension n = {n} =====\")\n",
        "\n",
        "        # Create function and test point based on function type\n",
        "        if function_type == 'quadratic':\n",
        "            f = QuadraticFunction(n)\n",
        "            x = np.random.normal(scale=5.0, size=n)\n",
        "        elif function_type == 'logistic':\n",
        "            f = LogisticLossFunction(input_dim=n, n_samples=500, random_state=42)\n",
        "            x = np.random.normal(scale=0.1, size=n)  # Smaller scale for logistic regression\n",
        "\n",
        "        # Create a dummy estimator for the compare_multiple_estimators function\n",
        "        mu = 1e-5\n",
        "        dummy_estimator = UnbiasedEstimator(zoo_batch_size=zoo_batch_size, mu=mu, a=2.0)\n",
        "\n",
        "        # Test against multiple reference estimators\n",
        "        print(f\"Testing estimators...\")\n",
        "        all_errors = compare_multiple_estimators(\n",
        "            dummy_estimator,\n",
        "            reference_names,\n",
        "            f,\n",
        "            x,\n",
        "            batch_size=zoo_batch_size,\n",
        "            num_trials=num_trials\n",
        "        )\n",
        "\n",
        "        # Add results to DataFrame\n",
        "        for method, errors in all_errors.items():\n",
        "            for error in errors:\n",
        "                all_results.append({\n",
        "                    'Function': function_type.capitalize(),\n",
        "                    'Dimension': n,\n",
        "                    'Method': method,\n",
        "                    'Error': error\n",
        "                })\n",
        "\n",
        "    # Convert to DataFrame\n",
        "    return pd.DataFrame(all_results)\n",
        "\n",
        "if __name__ == \"__main__\":\n",
        "    # Common parameters\n",
        "    zoo_batch_size = 3\n",
        "    reference_names = [\"unbiased_p4\", \"unbiased_p3\", \"gaussian\", \"uniform\", \"centralized_uniform\"]\n",
        "    # reference_names = [\"unbiased_p3\", \"gaussian\", \"uniform\", \"centralized_uniform\"]\n",
        "\n",
        "    # Dimensions to test for both functions\n",
        "    dimensions = [16, 64, 256, 1024, 4096]\n",
        "    num_trials = 100  # Reduced for faster execution\n",
        "\n",
        "    # Run experiments\n",
        "    print(\"Running quadratic function experiments...\")\n",
        "    quadratic_results = run_experiment('quadratic', dimensions, zoo_batch_size, num_trials, reference_names)\n",
        "\n",
        "    print(\"\\nRunning logistic function experiments...\")\n",
        "    logistic_results = run_experiment('logistic', dimensions, zoo_batch_size, num_trials, reference_names)\n",
        "\n",
        "    # Combine results\n",
        "    combined_results = pd.concat([quadratic_results, logistic_results])\n",
        "\n",
        "    # Define a consistent color palette for all methods\n",
        "    method_colors = {\n",
        "        'Unbiased_p3': '#ff7f00',   # orange\n",
        "        'Unbiased_p4': '#e41a1c',    # red\n",
        "        'Gaussian': '#377eb8',    # blue\n",
        "        'Uniform': '#4daf4a',      # green\n",
        "        'Centralized_uniform': '#984ea3'     # purple\n",
        "    }\n",
        "\n",
        "    # Set the style\n",
        "    sns.set_style(\"whitegrid\")\n",
        "    plt.rcParams.update({\n",
        "        'font.size': TICK_LABEL_FONTSIZE,\n",
        "        'axes.titlesize': SUBTITLE_FONTSIZE,\n",
        "        'axes.labelsize': AXIS_LABEL_FONTSIZE,\n",
        "        'xtick.labelsize': TICK_LABEL_FONTSIZE,\n",
        "        'ytick.labelsize': TICK_LABEL_FONTSIZE,\n",
        "        'legend.fontsize': LEGEND_FONTSIZE,\n",
        "    })\n",
        "\n",
        "    # Create a subplot grid\n",
        "    fig, axes = plt.subplots(1, 2, figsize=(18, 9), sharey=False)\n",
        "\n",
        "    # Plot quadratic function results\n",
        "    quadratic_data = combined_results[combined_results['Function'] == 'Quadratic']\n",
        "    b_quadratic = sns.boxplot(x='Dimension', y='Error', hue='Method', data=quadratic_data,\n",
        "                palette=method_colors, boxprops=dict(alpha=0.75), ax=axes[0])\n",
        "\n",
        "    # Add individual points for better visualization\n",
        "    sns.stripplot(x='Dimension', y='Error', hue='Method', data=quadratic_data,\n",
        "                 size=4, alpha=0.3, dodge=True, palette=method_colors, ax=axes[0])\n",
        "\n",
        "    # Improve plot appearance\n",
        "    axes[0].set_title('Quadratic Function', fontsize=SUBTITLE_FONTSIZE)\n",
        "    axes[0].set_xlabel('Dimension (d)', fontsize=AXIS_LABEL_FONTSIZE)\n",
        "    axes[0].set_ylabel('MSE Error', fontsize=AXIS_LABEL_FONTSIZE)\n",
        "    axes[0].set_yscale('log')\n",
        "    axes[0].legend([],[], frameon=False)  # Remove legend from first plot\n",
        "\n",
        "    # Plot logistic function results\n",
        "    logistic_data = combined_results[combined_results['Function'] == 'Logistic']\n",
        "    b_logistic = sns.boxplot(x='Dimension', y='Error', hue='Method', data=logistic_data,\n",
        "                palette=method_colors, boxprops=dict(alpha=0.75), ax=axes[1])\n",
        "\n",
        "    # Add individual points for better visualization\n",
        "    sns.stripplot(x='Dimension', y='Error', hue='Method', data=logistic_data,\n",
        "                 size=4, alpha=0.3, dodge=True, palette=method_colors, ax=axes[1])\n",
        "\n",
        "    # Improve plot appearance\n",
        "    axes[1].set_title('Logistic Function', fontsize=SUBTITLE_FONTSIZE)\n",
        "    axes[1].set_xlabel('Dimension (d)', fontsize=AXIS_LABEL_FONTSIZE)\n",
        "    axes[1].set_ylabel('MSE Error', fontsize=AXIS_LABEL_FONTSIZE)\n",
        "    axes[1].set_yscale('log')\n",
        "    axes[1].legend([],[], frameon=False)  # Remove legend from second plot\n",
        "\n",
        "    # Create a common legend at the bottom\n",
        "    handles, labels = axes[1].get_legend_handles_labels()\n",
        "\n",
        "    # Customize the labels with mathematical notation\n",
        "    custom_labels = []\n",
        "    for label in labels[:5]:\n",
        "        if label == 'Unbiased_p3':\n",
        "            custom_labels.append('$P_3$-Estimator')\n",
        "        elif label == 'Unbiased_p4':\n",
        "            custom_labels.append('$P_4$-Estimator')\n",
        "        elif label == 'Gaussian':\n",
        "            custom_labels.append('Gaussian')\n",
        "        elif label == 'Uniform':\n",
        "            custom_labels.append('Uniform')\n",
        "        elif label == 'Centralized_uniform':\n",
        "            custom_labels.append('Centralized Uniform')\n",
        "        else:\n",
        "            custom_labels.append(label)\n",
        "\n",
        "    fig.legend(handles[:5], custom_labels, loc='lower center', ncol=5,\n",
        "               title='Estimator', title_fontsize=LEGEND_FONTSIZE,\n",
        "               fontsize=LEGEND_FONTSIZE, bbox_to_anchor=(0.5, -0.05))\n",
        "\n",
        "    plt.tight_layout()\n",
        "    # Adjust the bottom margin to make room for the legend\n",
        "    plt.subplots_adjust(bottom=0.15)\n",
        "\n",
        "    plt.savefig('combined_dimension_comparison.png', dpi=300, bbox_inches='tight')\n",
        "\n",
        "    print(\"Experiment completed. Results saved to 'combined_dimension_comparison.png'\")"
      ]
    }
  ],
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}
