{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from privacy_estimates.experiments.aml import JobList"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## (1) Let's start with AgNews"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# first real, then synthetic - these are jobs for AgNews without canaries\n",
    "jobs = JobList.from_urls([\n",
    "    'https://ml.azure.com/runs/placid_wing_01zhxmz29r?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47#',\n",
    "    'https://ml.azure.com/runs/good_plate_pc7ht484bf?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47#'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "job = jobs[0]\n",
    "synthetic_job = jobs[1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "metrics = job.get_node('compute_utility_real').get_metrics()\n",
    "metrics_synthetic = synthetic_job.get_node('compute_utility_synthetic').get_metrics()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "metrics.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Real AUC: {metrics['eval_auc'][-1]}\")\n",
    "print(f\"Synthetic AUC: {metrics_synthetic['eval_auc'][-1]}\")\n",
    "print(f\"Real accuracy: {metrics['eval_accuracy'][-1]}\")\n",
    "print(f\"Synthetic accuracy: {metrics_synthetic['eval_accuracy'][-1]}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(1, 2, figsize=(10,5))\n",
    "\n",
    "# first do train real vs synthetic\n",
    "axes[0].plot(np.linspace(0, 1, len(metrics['loss'])), metrics['loss'], color = 'darkblue', label='Real')\n",
    "axes[0].plot(np.linspace(0, 1, len(metrics_synthetic['loss'])), metrics_synthetic['loss'], color = 'darkorange', label='Synthetic')\n",
    "axes[0].set_xticks([0, 0.5, 1])\n",
    "axes[0].set_xticklabels([0, 0.5, 1])\n",
    "axes[0].legend(fontsize=14)\n",
    "axes[0].grid()\n",
    "axes[0].set_xlabel('Epoch', fontsize=14)\n",
    "axes[0].set_ylabel('Loss', fontsize=14)\n",
    "axes[0].set_ylim(0, 1.0)\n",
    "axes[0].set_title('RoBERTa on AgNews - Train', fontsize=14)\n",
    "\n",
    "# now do eval loss\n",
    "axes[1].plot(np.linspace(0, 1, len(metrics['eval_loss'])), metrics['eval_loss'], color = 'darkblue', label='Real')\n",
    "axes[1].plot(np.linspace(0, 1, len(metrics_synthetic['eval_loss'])), metrics_synthetic['eval_loss'], color = 'darkorange', label='Synthetic')\n",
    "axes[1].set_xticks([0, 0.5, 1])\n",
    "axes[1].set_xticklabels([0, 0.5, 1])\n",
    "axes[1].legend(fontsize=14)\n",
    "axes[1].grid()\n",
    "axes[1].set_xlabel('Epoch', fontsize=14)\n",
    "axes[1].set_ylabel('Loss', fontsize=14)\n",
    "axes[1].set_ylim(0, 1.0)\n",
    "axes[1].set_title('RoBERTa on AgNews - Test', fontsize=14)\n",
    "\n",
    "plt.savefig('figures/utility_agnews.pdf', dpi=300, bbox_inches='tight', pad_inches=0)\n",
    "\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## (2) What about SST-2?"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# first real, then synthetic - these are jobs for SST-2 without canaries\n",
    "jobs = JobList.from_urls([\n",
    "    'https://ml.azure.com/runs/teal_screw_y44k8v2k0w?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47#',\n",
    "    'https://ml.azure.com/runs/brave_oregano_v2m17tb2rn?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47#'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "job = jobs[0]\n",
    "synthetic_job = jobs[1]\n",
    "\n",
    "metrics = job.get_node('compute_utility_real').get_metrics()\n",
    "metrics_synthetic = synthetic_job.get_node('compute_utility_synthetic').get_metrics()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Real AUC: {metrics['eval_auc'][-1]}\")\n",
    "print(f\"Synthetic AUC: {metrics_synthetic['eval_auc'][-1]}\")\n",
    "print(f\"Real accuracy: {metrics['eval_accuracy'][-1]}\")\n",
    "print(f\"Synthetic accuracy: {metrics_synthetic['eval_accuracy'][-1]}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(1, 2, figsize=(10,5))\n",
    "\n",
    "# first do train real vs synthetic\n",
    "axes[0].plot(np.linspace(0, 1, len(metrics['loss'])), metrics['loss'], color = 'darkblue', label='Real')\n",
    "axes[0].plot(np.linspace(0, 1, len(metrics_synthetic['loss'])), metrics_synthetic['loss'], color = 'darkorange', label='Synthetic')\n",
    "axes[0].set_xticks([0, 0.5, 1])\n",
    "axes[0].set_xticklabels([0, 0.5, 1])\n",
    "axes[0].legend(fontsize=14)\n",
    "axes[0].grid()\n",
    "axes[0].set_xlabel('Epoch', fontsize=14)\n",
    "axes[0].set_ylabel('Loss', fontsize=14)\n",
    "axes[0].set_ylim(0, 1.0)\n",
    "axes[0].set_title('RoBERTa on SST-2 - Train', fontsize=14)\n",
    "\n",
    "# now do eval loss\n",
    "axes[1].plot(np.linspace(0, 1, len(metrics['eval_loss'])), metrics['eval_loss'], color = 'darkblue', label='Real')\n",
    "axes[1].plot(np.linspace(0, 1, len(metrics_synthetic['eval_loss'])), metrics_synthetic['eval_loss'], color = 'darkorange', label='Synthetic')\n",
    "axes[1].set_xticks([0, 0.5, 1])\n",
    "axes[1].set_xticklabels([0, 0.5, 1])\n",
    "axes[1].legend(fontsize=14)\n",
    "axes[1].grid()\n",
    "axes[1].set_xlabel('Epoch', fontsize=14)\n",
    "axes[1].set_ylabel('Loss', fontsize=14)\n",
    "axes[1].set_ylim(0, 1.0)\n",
    "axes[1].set_title('RoBERTa on SST-2 - Test', fontsize=14)\n",
    "\n",
    "plt.savefig('figures/utility_sst2.pdf', dpi=300, bbox_inches='tight', pad_inches=0)\n",
    "\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## (3) Let's also look at this when we have included canaries"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "canary_to_url = {\n",
    "    'sst2_in_canary': 'https://ml.azure.com/runs/hungry_holiday_qczmtvhk9z?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47', \n",
    "    'sst2_syntheticcanary_uniformlabel': 'https://ml.azure.com/runs/purple_basil_ym4kcffrdq?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47',\n",
    "    'sst2_syntheticcanary_canarylabel': 'https://ml.azure.com/runs/sharp_farm_f0t24t04nx?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47',\n",
    "    'agnews_in_canary': 'https://ml.azure.com/runs/neat_circle_b73nft4qj2?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47',\n",
    "    'agnews_syntheticcanary_uniformlabel': 'https://ml.azure.com/runs/dynamic_lamp_9dth0rjpnj?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47',\n",
    "    'agnews_syntheticcanary_canarylabel': 'https://ml.azure.com/runs/honest_bee_3082g51276?wsid=/subscriptions/acc09744-1ee3-4242-b375-93421c63af0c/resourcegroups/PPML/workspaces/M365Research-PPML-EUS&tid=72f988bf-86f1-41af-91ab-2d7cd011db47'\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for canary_method in canary_to_url.keys():\n",
    "    print('Canary method: ', canary_method)\n",
    "    url = canary_to_url[canary_method]\n",
    "    if url != 'xx':\n",
    "        jobs = JobList.from_urls([url])\n",
    "        job = jobs[0]\n",
    "        metrics = job.get_node('compute_utility_synthetic').get_metrics()\n",
    "        print(f\"AUC: {metrics['eval_auc'][-1]}\")\n",
    "        print(f\"accuracy: {metrics['eval_accuracy'][-1]}\")\n",
    "    else:\n",
    "        print('No data available')\n",
    "    print('---')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "dp-transformers",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
