{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Papers that write about linear regression under differential privacy:\n",
    "\n",
    "\"Old Techniques in Differentially Private Linear Regression\"\n",
    "https://proceedings.mlr.press/v98/sheffet19a/sheffet19a.pdf\n",
    "\n",
    "\"Revisiting differentially private linear regression\"\n",
    "https://auai.org/uai2018/proceedings/papers/40.pdf \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "TORCH: Using device: cuda:0\n",
      "A shape: torch.Size([60000, 784])\n",
      "A type: <class 'torch.Tensor'>\n",
      "Number of sign patterns generated: 100\n"
     ]
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import sys\n",
    "import torch\n",
    "import torchvision.transforms as transforms\n",
    "import torchvision.datasets as datasets\n",
    "\n",
    "import Conv_relus_MNIST as cvxnn\n",
    "import dp_linear\n",
    "\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\", category=UserWarning)\n",
    "warnings.filterwarnings(\"ignore\", category=FutureWarning)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "num_neurons = 4096  # Number of neurons, or number of random fourier features\n",
    "beta = 0.01  # coefficient for the regularization term, lower is fewer regularization, 0 is no regularization\n",
    "do_extend = False\n",
    "\n",
    "eps_target = 2.88\n",
    "eps_target = 8.91\n",
    "eps_target = 0.2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "torch.Size([60000, 28, 28])\n",
      "torch.Size([10000, 28, 28])\n",
      "A shape: torch.Size([60000, 784])\n",
      "A type: <class 'torch.Tensor'>\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_1449668/2106817826.py:29: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n",
      "  RAW_train = transform_normalize(torch.tensor(train_dataset.data).to(torch.float))\n",
      "/tmp/ipykernel_1449668/2106817826.py:30: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n",
      "  RAW_test = transform_normalize(torch.tensor(test_dataset.data).to(torch.float))\n",
      "/tmp/ipykernel_1449668/2106817826.py:37: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n",
      "  y_train = torch.tensor(train_dataset.targets).to(torch.int64)\n",
      "/tmp/ipykernel_1449668/2106817826.py:38: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n",
      "  y_test = torch.tensor(test_dataset.targets).to(torch.int64)\n"
     ]
    }
   ],
   "source": [
    "directory = '../datasets/'\n",
    "device = \"cuda:0\"\n",
    "\n",
    "transform_normalize = transforms.Lambda(lambda x: (x / 255.0) * 2 - 1)\n",
    "# transform_normalize = lambda x: x\n",
    "\n",
    "def transform_normalize_cifar(X):\n",
    "    renormalize = transforms.Normalize(mean=[0.507, 0.487, 0.441], std=[0.267, 0.256, 0.276])\n",
    "    X = X/255.0\n",
    "    X = X.transpose(1, 3)\n",
    "    X = renormalize(X)\n",
    "    X = X.transpose(1, 3)\n",
    "    return X\n",
    "\n",
    "\n",
    "dataset_name = \"MNIST\"\n",
    "if dataset_name == \"MNIST\":\n",
    "    train_dataset = datasets.MNIST(directory, train=True, download=True,transform=transforms.Compose([transforms.ToTensor()]))\n",
    "    test_dataset =  datasets.MNIST(directory, train=False, transform=transforms.Compose([transforms.ToTensor()]))\n",
    "elif dataset_name == \"CIFAR10\":\n",
    "    train_dataset = datasets.CIFAR10(directory, train=True, download=True,transform=transforms.Compose([transforms.ToTensor()]))\n",
    "    test_dataset =  datasets.CIFAR10(directory, train=False, transform=transforms.Compose([transforms.ToTensor()]))\n",
    "elif dataset_name == \"FMNIST\":\n",
    "    train_dataset = datasets.FashionMNIST(directory, train=True, download=True,transform=transforms.Compose([transforms.ToTensor()]))\n",
    "    test_dataset =  datasets.FashionMNIST(directory, train=False, transform=transforms.Compose([transforms.ToTensor()]))\n",
    "else:\n",
    "    raise ValueError(f\"Dataset {dataset_name} not supported\")\n",
    "\n",
    "RAW_train = transform_normalize(torch.tensor(train_dataset.data).to(torch.float))\n",
    "RAW_test = transform_normalize(torch.tensor(test_dataset.data).to(torch.float))\n",
    "print(RAW_train.shape)\n",
    "print(RAW_test.shape)\n",
    "# flatten along the 28x28 gray scale images\n",
    "RAW_train = RAW_train.reshape(RAW_train.shape[0], -1)\n",
    "RAW_test = RAW_test.reshape(RAW_test.shape[0], -1)\n",
    "\n",
    "y_train = torch.tensor(train_dataset.targets).to(torch.int64)\n",
    "y_test = torch.tensor(test_dataset.targets).to(torch.int64)\n",
    "\n",
    "y_hot_train = torch.zeros(y_train.shape[0], 10)\n",
    "y_hot_train.scatter_(1, y_train.unsqueeze(1), 1)\n",
    "y_hot_train = y_hot_train.to(device)\n",
    "\n",
    "\n",
    "num_train_samples, num_features = RAW_train.size()\n",
    "print('A shape: ' + str(RAW_train.shape))\n",
    "print('A type: ' + str(type(RAW_train)))\n",
    "\n",
    "beta = torch.tensor(beta).to(device)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Num neurons:     64 - Priv ReLU 20.0% +- 5.6% - Priv RFF: 24.5% +- 8.1%\n",
      "Num neurons:    128 - Priv ReLU 23.9% +- 6.9% - Priv RFF: 26.5% +- 4.6%\n",
      "Num neurons:    256 - Priv ReLU 22.4% +- 8.3% - Priv RFF: 29.5% +- 6.6%\n",
      "Num neurons:    512 - Priv ReLU 21.8% +- 4.5% - Priv RFF: 32.3% +- 5.2%\n",
      "Num neurons:   1024 - Priv ReLU 24.6% +- 6.4% - Priv RFF: 27.9% +- 7.8%\n",
      "Num neurons:   2048 - Priv ReLU 23.6% +- 9.5% - Priv RFF: 26.8% +- 5.7%\n",
      "Num neurons:   4096 - Priv ReLU 25.4% +- 6.0% - Priv RFF: 29.0% +- 5.9%\n",
      "Num neurons:   8192 - Priv ReLU 20.5% +- 6.5% - Priv RFF: 27.2% +- 5.3%\n"
     ]
    }
   ],
   "source": [
    "clip_rff = 2\n",
    "clip_relu = 8\n",
    "\n",
    "num_monte_carlo = 5\n",
    "\n",
    "for num_neurons in [64, 128, 256, 512, 1024, 2048, 4096, 8192]:\n",
    "    # ReLU features\n",
    "\n",
    "    X_relu_train, X_relu_test = dp_linear.generate_relu_features(RAW_train, RAW_test, num_neurons, do_extend=do_extend)\n",
    "    X_relu_train, X_relu_test = X_relu_train.to(device), X_relu_test.to(device)\n",
    "\n",
    "    # RFF features\n",
    "    gamma = 1.0 / (num_features * RAW_train.std()) # Heuristic for choosing gamma\n",
    "\n",
    "    X_rff, W, b = dp_linear.generate_rff(RAW_train, n_components=num_neurons, gamma=gamma, do_extend=do_extend)\n",
    "    X_rff = torch.hstack([X_rff, torch.ones((X_rff.shape[0], 1))]).to(device)\n",
    "\n",
    "    X_rff_test = dp_linear.generate_rff_test(RAW_test, W, b, num_neurons, do_extend=do_extend)\n",
    "    X_rff_test = torch.hstack([X_rff_test, torch.ones((X_rff_test.shape[0], 1))]).to(device)\n",
    "\n",
    "    results_df = pd.DataFrame(columns=[\n",
    "        \"seed\",\n",
    "        \"adassp_relu_test_acc\",\n",
    "        \"adassp_rff_test_acc\",\n",
    "    ])\n",
    "\n",
    "    for i in range(num_monte_carlo):\n",
    "        w_priv_ada_relu = dp_linear.adassp(X_relu_train, y_hot_train, eps_target, delta=1e-6)\n",
    "        w_priv_ada_rff = dp_linear.adassp(X_rff, y_hot_train, eps_target, delta=1e-6)\n",
    "\n",
    "        # ADASPP evaluation\n",
    "        # accuracy_adassp_relu = torch.mean((torch.argmax(X_relu_train @ w_priv_ada_relu, axis=1).cpu() == y_train).float())\n",
    "        accuracy_adassp_relu_test = torch.mean((torch.argmax(X_relu_test @ w_priv_ada_relu, axis=1).cpu() == y_test).float())\n",
    "        # accuracy_adassp_rff = torch.mean((torch.argmax(X_rff @ w_priv_ada_rff, axis=1).cpu() == y_train).float())\n",
    "        accuracy_adassp_rff_test = torch.mean((torch.argmax(X_rff_test @ w_priv_ada_rff, axis=1).cpu() == y_test).float())\n",
    "\n",
    "        results_df.loc[i] = [\n",
    "        i,\n",
    "        # 100 * accuracy_adassp_relu.item(),\n",
    "        100 * accuracy_adassp_relu_test.item(),\n",
    "        # 100 * accuracy_adassp_rff.item(),\n",
    "        100 * accuracy_adassp_rff_test.item()]\n",
    "\n",
    "    print(f\"Num neurons: {num_neurons:6} - \"\n",
    "          f\"Priv ReLU {results_df.adassp_relu_test_acc.mean():.1f}% +- {results_df.adassp_relu_test_acc.std()*1.96:.1f}% - \"\n",
    "          f\"Priv RFF: {results_df.adassp_rff_test_acc.mean():.1f}% +- {results_df.adassp_rff_test_acc.std()*1.96:.1f}%\", flush=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "pyt310",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
