{"cells":[{"cell_type":"code","execution_count":1,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":21590,"status":"ok","timestamp":1727824900838,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"SG_KSqn32lo4","outputId":"76c5bea4-306a-4f8a-fa08-3203d5f6ffda"},"outputs":[{"name":"stdout","output_type":"stream","text":["Mounted at /content/drive\n","The autoreload extension is already loaded. To reload it, use:\n","  %reload_ext autoreload\n"]}],"source":["from google.colab import drive\n","drive.mount('/content/drive')\n","\n","# put folder name here\n","FOLDERNAME = 'multiclass_polyact/'\n","\n","import sys\n","sys.path.append('/content/drive/My Drive/{}'.format(FOLDERNAME))\n","\n","%load_ext autoreload\n","%autoreload 2\n","\n","import torch\n","import numpy as np\n","import matplotlib.pyplot as plt\n","import cvxpy as cp\n","\n","import os\n","from utils import *\n","%load_ext autoreload\n","%autoreload 2"]},{"cell_type":"code","execution_count":2,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":4455,"status":"ok","timestamp":1727824905282,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"JG8Kitv9iJW6","outputId":"f73e1363-d9b8-4732-c1ac-5b3831504723"},"outputs":[{"name":"stdout","output_type":"stream","text":["Collecting ucimlrepo\n","  Downloading ucimlrepo-0.0.7-py3-none-any.whl.metadata (5.5 kB)\n","Requirement already satisfied: pandas>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from ucimlrepo) (2.2.2)\n","Requirement already satisfied: certifi>=2020.12.5 in /usr/local/lib/python3.10/dist-packages (from ucimlrepo) (2024.8.30)\n","Requirement already satisfied: numpy>=1.22.4 in /usr/local/lib/python3.10/dist-packages (from pandas>=1.0.0->ucimlrepo) (1.26.4)\n","Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas>=1.0.0->ucimlrepo) (2.8.2)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas>=1.0.0->ucimlrepo) (2024.2)\n","Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.10/dist-packages (from pandas>=1.0.0->ucimlrepo) (2024.2)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas>=1.0.0->ucimlrepo) (1.16.0)\n","Downloading ucimlrepo-0.0.7-py3-none-any.whl (8.0 kB)\n","Installing collected packages: ucimlrepo\n","Successfully installed ucimlrepo-0.0.7\n"]}],"source":["!pip install ucimlrepo"]},{"cell_type":"code","execution_count":3,"metadata":{"executionInfo":{"elapsed":1320,"status":"ok","timestamp":1727824906599,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"ovTioE-9h41G"},"outputs":[],"source":["from ucimlrepo import fetch_ucirepo\n","\n","# fetch dataset\n","breast_cancer_wisconsin_original = fetch_ucirepo(id=15)\n","\n","# data (as pandas dataframes)\n","X = breast_cancer_wisconsin_original.data.features\n","y = breast_cancer_wisconsin_original.data.targets\n","X = X.fillna(0)\n","\n","train_frac = 0.8\n","x_np = X.to_numpy()\n","\n","# convert y vector of 2's and 4's to a vector of 1's and -1's.\n","y_np = 2 * ((y.to_numpy().squeeze() - 2) / 2) - 1\n","\n","n,d = x_np.shape\n","xtrain, ytrain = x_np[:int(train_frac*n), :], y_np[:int(train_frac*n)]\n","xtest, ytest = x_np[int(train_frac*n):, :], y_np[int(train_frac*n):]\n","mean, std = xtrain.mean(axis=0, keepdims = True), xtrain.std(axis=0, keepdims=True)\n","xtrain = (xtrain - mean)/(std + 1e-9)\n","xtest = (xtest - mean)/(std + 1e-9)\n","\n","def form_robust_psd_matrix_numpy(Z_tilde, lbda_i, w_i, x_i, y_i, r, d_r,a=0.09,b=0.5,c=0.47):\n","  Z_1, Z_2, Z_4 = Z_tilde[:-1,:-1], Z_tilde[:-1,-1:], Z_tilde[d_r-1:d_r,d_r-1:d_r]\n","  no_lambda_block = np.zeros((d_r+1,d_r+1))\n","\n","  b1 = cp.hstack((a*Z_1, a*Z_1 @ x_i.T - 0.5*b*Z_2))\n","  b2 =  cp.hstack(((a*Z_1 @ x_i.T - 0.5*b*Z_2).T, cp.reshape(forward_cp(x_i, Z_tilde) - w_i*y_i, (1,1))))\n","  no_lambda_block = cp.vstack((b1,b2))\n","\n","  lambda_block = np.eye(no_lambda_block.shape[0])\n","  lambda_block[-1,d_r:d_r+1] = -r.value**2\n","  return lbda_i*lambda_block + y_i * no_lambda_block\n","\n","def forward_cp(X, Z_tilde_sym, a=0.09, b=0.5, c=0.47):\n","  return a * cp.sum(cp.multiply(X, X @ Z_tilde_sym[:-1,:-1]), axis=1) + b * X @ Z_tilde_sym[:-1,-1] + c * Z_tilde_sym[-1,-1]\n","\n","def cvx_prob(x,y,r,beta, verbose=False, tol=1e-5,idxs=None, warm_start=False):\n","  if idxs is None:\n","    idxs = np.arange(x.shape[0])\n","  n, d = x.shape\n","  Z = cp.Variable((d + 1, d + 1), symmetric=True)\n","  Zp = cp.Variable((d + 1, d + 1), symmetric=True)\n","  w = cp.Variable(n)\n","  lbda = cp.Variable(n)\n","\n","  constraints = []\n","  for i in idxs:\n","    constraints =constraints + [form_robust_psd_matrix_numpy(Z-Zp, lbda[i], w[i], x[i:i+1], y[i], r, d) >> 0]\n","  constraints =constraints + [lbda >= 0, cp.trace(Z[:-1,:-1]) == Z[-1,-1], cp.trace(Zp[:-1,:-1]) == Zp[-1,-1], Z >>0, Zp >> 0]\n","  prob = cp.Problem(cp.Minimize(cp.sum(cp.pos(1 - w)) + beta*(Z[-1,-1] + Zp[-1,-1])), constraints)\n","  prob.solve(solver=cp.SCS, verbose=verbose, eps=tol, warm_start=warm_start)\n","  return prob, Z, Zp, w, lbda\n","\n","def cvx_nonrobust(x,y,beta):\n","  n, d = x.shape\n","  Z = cp.Variable((d + 1, d + 1), symmetric=True)\n","  Zp = cp.Variable((d + 1, d + 1), symmetric=True)\n","\n","  constraints = [cp.trace(Z[:-1,:-1]) == Z[-1,-1], cp.trace(Zp[:-1,:-1]) == Zp[-1,-1], Z >> 0, Zp >> 0]\n","  out = forward_cp(x, Z-Zp)\n","  prob = cp.Problem(cp.Minimize(cp.mean(cp.pos(1 - cp.multiply(y,out))) + beta*(Z[-1,-1] + Zp[-1,-1])), constraints)\n","  prob.solve()\n","  return prob, Z, Zp\n","\n","def evaluate_robust_accuracies(X, y, Z_tilde, device, magnitudes=0.1*np.arange(7)):\n","  out = {}\n","  for attack_size in magnitudes:\n","    out[attack_size] = accuracy(y, forward(X + fgsm(y, X, Z_tilde, device, magnitude=attack_size, order=np.inf), Z_tilde))\n","    print(round(attack_size, 3), ':', round(out[attack_size], 4))\n","  return out\n","\n","def flip_distance(Z_tilde, x, label):\n","    a,b,c = 0.09, 0.5, 0.47\n","    d = x.shape[1]\n","    gamma, s = cp.Variable((1,1)), cp.Variable((1, 1))\n","    A0, b0, c0 = -np.eye(x.shape[1]), x.T, -np.linalg.norm(x)**2\n","  \n","    A1 = label * a*(Z_tilde[:-1,:-1])\n","    b1 = label * (b/2)*(Z_tilde[:-1,-1])[:,None]\n","    c1 = label * c*Z_tilde[-1,-1][None][None]\n","    print(A1.shape, c1.shape, b1.shape)\n","    block1 = cp.bmat([[A0, b0], [b0.T, c0 + s]])\n","    block2 = gamma * cp.bmat([[A1, b1],[b1.T, c1]])\n","    constraints = [block2 - block1 >> 0, gamma >= 0]\n","    obj = cp.Maximize(s)\n","    prob = cp.Problem(obj,constraints)\n","    dist = prob.solve(solver=cp.SCS)\n","    return np.sqrt(dist)"]},{"cell_type":"code","execution_count":4,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":420,"status":"ok","timestamp":1727824907017,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"FTn8fvT33r8s","outputId":"f4255c4d-402b-4ede-a7f3-d733dfce3049"},"outputs":[{"name":"stdout","output_type":"stream","text":["5.309603108171895\n"]}],"source":["tot = 0\n","count = 0\n","out = []\n","for x1 in xtrain[ytrain == 1]:\n","  for x2 in xtrain[ytrain == -1]:\n","    cur = np.linalg.norm(x1-x2)\n","    out.append(cur)\n","    tot += cur\n","    count += 1\n","\n","print(tot/count)"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":263},"executionInfo":{"elapsed":28148,"status":"error","timestamp":1727824935164,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"ayv9I9BBEsE-","outputId":"63843c04-ae9a-49a0-a13d-97eeb86b78ce"},"outputs":[],"source":["beta = 0.01\n","robust_sizes = np.linspace(0.4,0.5,2)\n","avg_dists = []\n","clean_accs = []\n","robust_accs = []\n","clean = 0.0\n","robust = 0.8\n","warm_start = False\n","for robust_radius in robust_sizes[:20]: #robust_sizes:\n","  print(robust_radius)\n","  r = cp.Parameter(1)\n","  r.value = np.array([robust_radius])\n","  prob, Z, Zp, w, lbda = cvx_prob(xtrain, ytrain, r, beta, tol=1e-5, verbose=False, warm_start=warm_start)\n","  warm_start = True\n","\n","  Z_tilde = torch.tensor((Z-Zp).value)\n","\n","  out_dict = evaluate_robust_accuracies(torch.tensor(xtest), torch.tensor(ytest), Z_tilde, 'cpu', magnitudes = np.array([clean, robust]))\n","\n","  clean_accs.append(out_dict[clean])\n","  robust_accs.append(out_dict[robust])\n","\n","  count_robust = 0\n","  count_nonrobust = 0\n","  dists_robust = []\n","\n","\n","  for i, y in enumerate(ytest):\n","    curx = xtest[i:i+1]\n","    out_r = forward(torch.tensor(curx), Z_tilde)\n","    if np.sign(out_r) == y:\n","      count_robust += 1\n","      dist = flip_distance(Z_tilde.numpy(), curx, y)\n","      dists_robust.append(dist)\n","\n","  avg_dists.append(sum(dists_robust)/count_robust)"]},{"cell_type":"code","execution_count":null,"metadata":{"executionInfo":{"elapsed":12,"status":"aborted","timestamp":1727824935165,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"q3VYoJSxGpxj"},"outputs":[],"source":["nonrobust_p, Z_nonrobust, Zp_nonrobust = cvx_nonrobust(xtrain, ytrain, beta)\n","Z_tilde_nonrobust =torch.tensor((Z_nonrobust- Zp_nonrobust).value)\n","dists_nonrobust = []\n","for i, y in enumerate(ytest):\n","    curx = xtest[i:i+1]\n","    out_r = forward(torch.tensor(curx), Z_tilde_nonrobust)\n","    if np.sign(out_r) == y:\n","      count_robust += 1\n","      dist = flip_distance(Z_tilde_nonrobust.numpy(), curx, y)\n","      dists_nonrobust.append(dist)\n","avg_dists_nonrobust = sum(dists_nonrobust)/len(dists_nonrobust)"]},{"cell_type":"code","execution_count":null,"metadata":{"executionInfo":{"elapsed":12,"status":"aborted","timestamp":1727824935165,"user":{"displayName":"Daniel Kuelbs","userId":"00355856873650556171"},"user_tz":420},"id":"xkmKJhYWKeKM"},"outputs":[],"source":["fig, axs = plt.subplots(1,2, figsize=(12,3))\n","font_dict = {'fontsize': 14}\n","axs[0].plot(robust_sizes[:16], avg_dists[:16],'-', color='red', linewidth=2,label='Adversarial')\n","axs[0].hlines(avg_dists_nonrobust,robust_sizes[0], robust_sizes[16], linestyles='--', linewidth=2, color='black', label=r'Standard' )\n","axs[0].set_xlabel(r'Robust radius parameter $r$', **font_dict)\n","axs[0].set_ylabel(r'$d_\\mathcal{D}(x)$', **font_dict)\n","axs[0].set_xlim([robust_sizes[0], robust_sizes[15]])\n","\n","axs[1].plot(robust_sizes[:20], clean_accs[:20], '-', color='blue', linewidth=2, label='Clean Adversarial')\n","axs[1].plot(robust_sizes[:20], robust_accs[:20], '--', color='blue', linewidth=2,label=r'Robust Adversarial')\n","axs[1].hlines(nonrobust_fgsm_acc[robust], robust_sizes[0], robust_sizes[20], linestyles='--',linewidth=2,color='black', label = r'Robust Standard')\n","axs[1].set_xlabel(r'Robust radius parameter $r$', **font_dict)\n","axs[1].set_xlim([robust_sizes[0], robust_sizes[19]])\n","axs[1].set_ylabel(\"Test accuracy\", **font_dict)\n","\n","axs[0].legend(**font_dict, loc='upper left')\n","axs[1].legend(**font_dict, loc = 'center right', bbox_to_anchor=(1, 0.37), ncol=1)#, loc='center right')\n","fig.autofmt_xdate()\n","plt.savefig('BCW_dist_plot.png')"]}],"metadata":{"colab":{"authorship_tag":"ABX9TyPZNCDCMLy4KS3VtT1qc0xk","machine_shape":"hm","mount_file_id":"1-7XhFitzb1LoNokCrCh4R5JnZaqIlfKe","provenance":[{"file_id":"1KVVLH9xtLo0IqcjvF7NfdWC1y0VHw0P1","timestamp":1727570683163},{"file_id":"1jBuVGkekSDqpCh_HAbUC65TY2G-Kza6q","timestamp":1708812783527},{"file_id":"1l34JuZpxZkB3YTvTi7agJv733rb02KW_","timestamp":1693848094597},{"file_id":"1-7XhFitzb1LoNokCrCh4R5JnZaqIlfKe","timestamp":1693536802143}]},"kernelspec":{"display_name":"Python 3","name":"python3"},"language_info":{"name":"python"}},"nbformat":4,"nbformat_minor":0}
