{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "e4760c69-bb95-4804-8f60-e2384c8cd0fb",
   "metadata": {},
   "source": [
    "第一部分的实验是针对噪声的方差，特别是x2的方差。\n",
    "1：噪声方差作为横坐标\n",
    "2：训练批次作为横坐标，看不同的方差对损失的影响\n",
    "\n",
    "\n",
    "第二部分预计变化x3到x16的方差，但是可能m后边要改为2，所以暂时不进行实验"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "4abe0306-efd5-4d86-95f6-b845d3e38b65",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_148/542168101.py:78: UserWarning: Creating a tensor from a list of numpy.ndarrays is extremely slow. Please consider converting the list to a single numpy.ndarray with numpy.array() before converting to a tensor. (Triggered internally at /opt/pytorch/pytorch/torch/csrc/utils/tensor_new.cpp:230.)\n",
      "  D = torch.tensor(D, dtype=torch.float32).cuda()\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "0\n",
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "0\n",
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "0\n",
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n"
     ]
    }
   ],
   "source": [
    "import math\n",
    "import numpy\n",
    "import numpy as np\n",
    "import torch\n",
    "from torch import nn, optim\n",
    "\n",
    "M = 16\n",
    "d = 1024\n",
    "n_ = 100\n",
    "dh = 512\n",
    "dv = 512\n",
    "\n",
    "class TF(nn.Module):\n",
    "    def __init__(self):\n",
    "        super().__init__()\n",
    "        self.q = nn.Linear(d, dh, bias=False)\n",
    "        self.k = nn.Linear(d, dh, bias=False)\n",
    "        self.v = nn.Linear(d, dv, bias=False)\n",
    "        self.fc = nn.Linear(dv, 1, bias=False)\n",
    "        self.fc.requires_grad_(False)\n",
    "        self.q.weight.data /= 16\n",
    "        self.k.weight.data /= 16\n",
    "        self.v.weight.data /= 16\n",
    "\n",
    "\n",
    "    def forward(self, x):\n",
    "        q = self.q(x)\n",
    "        k = self.k(x)\n",
    "        v = self.v(x)\n",
    "        qk = torch.matmul(q, k.transpose(1, 2))\n",
    "        attn = qk.softmax(dim=2)\n",
    "        attn = torch.sum(attn, dim=1).unsqueeze(1)\n",
    "        attn /= M\n",
    "        z = torch.matmul(attn, v).squeeze(1)\n",
    "        return self.fc(z)\n",
    "\n",
    "def make_mu1(mu):\n",
    "    mu1 = numpy.zeros(d)\n",
    "    mu1[0] = mu\n",
    "    return mu1\n",
    "\n",
    "def make_mu2(mu):\n",
    "    mu2 = numpy.zeros(d)\n",
    "    mu2[1] = mu\n",
    "    return mu2\n",
    "\n",
    "def make_noise(strength):\n",
    "    return numpy.random.normal(0, strength, size=d)\n",
    "\n",
    "def get_test_loss(n, mu, cp):\n",
    "    D = []\n",
    "    D_Y = []\n",
    "    D_ = []\n",
    "    D_Y_ = []\n",
    "\n",
    "    mu1 = make_mu1(mu)\n",
    "    mu2 = make_mu2(mu)\n",
    "\n",
    "    D_mu = []\n",
    "    D_mu_ = []\n",
    "\n",
    "    for i in range(int(n / 2)):\n",
    "        X = mu1.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D.append(X)\n",
    "        D_Y.append([1.])\n",
    "        D_mu.append(mu1.reshape(1, d))\n",
    "        X = mu2.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D.append(X)\n",
    "        D_Y.append([-1.])\n",
    "        D_mu.append(mu2.reshape(1, d))\n",
    "\n",
    "    D = torch.tensor(D, dtype=torch.float32).cuda()\n",
    "    D_Y = torch.tensor(D_Y).cuda()\n",
    "\n",
    "    for i in range(int(n_ / 2)):\n",
    "        X = mu1.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D_.append(X)\n",
    "        D_Y_.append([1.])\n",
    "        D_mu_.append(mu1.reshape(1, d))\n",
    "        X = mu2.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D_.append(X)\n",
    "        D_Y_.append([-1.])\n",
    "        D_mu_.append(mu2.reshape(1, d))\n",
    "\n",
    "    D_ = torch.tensor(D_, dtype=torch.float32).cuda()\n",
    "    D_Y_ = torch.tensor(D_Y_).cuda()\n",
    "\n",
    "    model = TF().cuda()\n",
    "\n",
    "    optimizer = optim.SGD(model.parameters(), lr=0.1, momentum=0)\n",
    "    loss_fn = nn.SoftMarginLoss().cuda()\n",
    "    EPOCHS = 1000\n",
    "\n",
    "    for epoch in range(1, EPOCHS + 1):\n",
    "        model.train()\n",
    "        optimizer.zero_grad()\n",
    "        output = model(D)\n",
    "\n",
    "        training_loss = loss_fn(output, D_Y)\n",
    "        training_loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "        model.eval()\n",
    "        output = model(D_)\n",
    "        test_loss = loss_fn(output, D_Y_)\n",
    "\n",
    "        if training_loss < 0.01:\n",
    "            return test_loss\n",
    "def Get_test_loss(n, mu,cp):\n",
    "    D = []\n",
    "    D_Y = []\n",
    "    D_ = []\n",
    "    D_Y_ = []\n",
    "\n",
    "    mu1 = make_mu1(mu)\n",
    "    mu2 = make_mu2(mu)\n",
    "\n",
    "    D_mu = []\n",
    "    D_mu_ = []\n",
    "\n",
    "    for i in range(int(n / 2)):\n",
    "        X = mu1.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D.append(X)\n",
    "        D_Y.append([1.])\n",
    "        D_mu.append(mu1.reshape(1, d))\n",
    "        X = mu2.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D.append(X)\n",
    "        D_Y.append([-1.])\n",
    "        D_mu.append(mu2.reshape(1, d))\n",
    "\n",
    "    D = torch.tensor(D, dtype=torch.float32).cuda()\n",
    "    D_Y = torch.tensor(D_Y).cuda()\n",
    "\n",
    "    for i in range(int(n_ / 2)):\n",
    "        X = mu1.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D_.append(X)\n",
    "        D_Y_.append([1.])\n",
    "        D_mu_.append(mu1.reshape(1, d))\n",
    "        X = mu2.copy().reshape(1, d)\n",
    "        X = numpy.concatenate((X, (make_noise(cp)).reshape(1, d)), 0)\n",
    "        for j in range(M - 2):\n",
    "            X = numpy.concatenate((X, (make_noise(0.2)).reshape(1, d)), 0)\n",
    "        D_.append(X)\n",
    "        D_Y_.append([-1.])\n",
    "        D_mu_.append(mu2.reshape(1, d))\n",
    "\n",
    "    D_ = torch.tensor(D_, dtype=torch.float32).cuda()\n",
    "    D_Y_ = torch.tensor(D_Y_).cuda()\n",
    "\n",
    "    model = TF().cuda()\n",
    "\n",
    "    optimizer = optim.SGD(model.parameters(), lr=0.1, momentum=0)\n",
    "    loss_fn = nn.SoftMarginLoss().cuda()\n",
    "    EPOCHS = 1000\n",
    "\n",
    "    test_losses = []\n",
    "    for epoch in range(1, EPOCHS + 1):\n",
    "        model.train()\n",
    "        optimizer.zero_grad()\n",
    "        output = model(D)\n",
    "\n",
    "        training_loss = loss_fn(output, D_Y)\n",
    "        training_loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "        model.eval()\n",
    "        output = model(D_)\n",
    "        test_loss = loss_fn(output, D_Y_)\n",
    "        # return test_loss\n",
    "        if epoch%10 == 0:\n",
    "            test_losses.append(test_loss.item())\n",
    "\n",
    "    return test_losses  \n",
    "        \n",
    "        \n",
    "size = 20\n",
    "n_scale = 2\n",
    "mu_scale = 1\n",
    "\n",
    "# 噪声强度（方差）作为横坐标\n",
    "matrix = np.zeros((size, 100))\n",
    "for n in range(size):\n",
    "    print(n)\n",
    "    for mu in range(100):\n",
    "        matrix[n, mu] = get_test_loss(100, 36, (mu+1)*0.1)\n",
    "np.savetxt('噪声方差.npy', matrix)\n",
    "\n",
    "# 迭代次数作为横坐标，探究不同的噪声方差对损失的影响\n",
    "matrix1 = np.zeros((20, 100))\n",
    "for n in range(20):\n",
    "    print(n)\n",
    "    test_losses = Get_test_loss(100, 16, 0.5)\n",
    "    matrix[n, :] = test_losses\n",
    "np.savetxt('0.5.npy', matrix1)\n",
    "                                      \n",
    "matrix2 = np.zeros((20, 100))\n",
    "for n in range(20):\n",
    "    print(n)\n",
    "    test_losses = Get_test_loss(100, 36,4)\n",
    "    matrix[n, :] = test_losses\n",
    "np.savetxt('4.npy', matrix2)\n",
    "\n",
    "matrix3 = np.zeros((20, 100))\n",
    "for n in range(20):\n",
    "    print(n)\n",
    "    test_losses = Get_test_loss(100, 64, 16)\n",
    "    matrix[n, :] = test_losses\n",
    "np.savetxt('16.npy', matrix3)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "07a3c271-e36b-4da8-ac33-a4046c29dc4a",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
