{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": [],
      "gpuType": "L4",
      "machine_shape": "hm",
      "collapsed_sections": [
        "qTmY_XxLqWl-",
        "auHqb2pK7eIi"
      ]
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    },
    "accelerator": "GPU"
  },
  "cells": [
    {
      "cell_type": "markdown",
      "source": [
        "# **Material_1**"
      ],
      "metadata": {
        "id": "o5xywNmi7dKJ"
      }
    },
    {
      "cell_type": "markdown",
      "source": [
        "## **dataset: CIFAR10**"
      ],
      "metadata": {
        "id": "3Kv3LgP1FexC"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "9ON164sK6dJi",
        "outputId": "f644c719-091d-4cf2-df5d-323545c7ddd7"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Wed May 22 19:36:59 2024       \n",
            "+---------------------------------------------------------------------------------------+\n",
            "| NVIDIA-SMI 535.104.05             Driver Version: 535.104.05   CUDA Version: 12.2     |\n",
            "|-----------------------------------------+----------------------+----------------------+\n",
            "| GPU  Name                 Persistence-M | Bus-Id        Disp.A | Volatile Uncorr. ECC |\n",
            "| Fan  Temp   Perf          Pwr:Usage/Cap |         Memory-Usage | GPU-Util  Compute M. |\n",
            "|                                         |                      |               MIG M. |\n",
            "|=========================================+======================+======================|\n",
            "|   0  NVIDIA A100-SXM4-40GB          Off | 00000000:00:04.0 Off |                    0 |\n",
            "| N/A   38C    P0              48W / 400W |      2MiB / 40960MiB |      0%      Default |\n",
            "|                                         |                      |             Disabled |\n",
            "+-----------------------------------------+----------------------+----------------------+\n",
            "                                                                                         \n",
            "+---------------------------------------------------------------------------------------+\n",
            "| Processes:                                                                            |\n",
            "|  GPU   GI   CI        PID   Type   Process name                            GPU Memory |\n",
            "|        ID   ID                                                             Usage      |\n",
            "|=======================================================================================|\n",
            "|  No running processes found                                                           |\n",
            "+---------------------------------------------------------------------------------------+\n"
          ]
        }
      ],
      "source": [
        "! nvidia-smi"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "# Data processing\n",
        "import numpy as np\n",
        "import torch\n",
        "import torchvision\n",
        "import torch.nn as nn\n",
        "from matplotlib import pyplot as plt\n",
        "import torch\n",
        "from torch.utils.data import DataLoader, Subset\n",
        "import torch.optim as optim\n",
        "import torchvision.transforms as transforms\n",
        "from torch.utils.data import random_split\n",
        "from torch.utils.data import DataLoader, ConcatDataset, random_split\n",
        "\n",
        "transform = transforms.Compose(\n",
        "    [transforms.ToTensor(),\n",
        "     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])\n",
        "################################################################################################################################################\n",
        "# 50000 training images / 4 = 12500\n",
        "# Set download to True for the first use to automatically download the dataset\n",
        "all_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)\n",
        "test_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)\n",
        "print(len(all_set))  # Print the number of training samples\n",
        "print(len(test_set))  # Print the number of test samples\n",
        "e12_, e34_ = random_split(dataset=all_set, lengths=[25000, 25000], generator=torch.Generator().manual_seed(0))\n",
        "################################################################################################################################################\n",
        "num_classes = 10  # Number of classes\n",
        "samples_per_class = 10  # Number of samples to extract per class\n",
        "################################################################################################################################################\n",
        "# Extract samples from e12_\n",
        "extracted_samples_e12 = {class_idx: [] for class_idx in range(10)}  # Initialize a dictionary to store extracted samples\n",
        "for idx, (image, label) in enumerate(e12_):  # Extract specified number of samples from e12_ dataset\n",
        "    if len(extracted_samples_e12[label]) < 10:\n",
        "        extracted_samples_e12[label].append(idx)\n",
        "    if all(len(samples) == 10 for samples in extracted_samples_e12.values()):  # Check if required number of samples are extracted\n",
        "        break\n",
        "extracted_samples_flat_e12 = [sample_idx for samples in extracted_samples_e12.values() for sample_idx in samples]  # Flatten the list of extracted samples\n",
        "ee12_ = torch.utils.data.Subset(e12_, [idx for idx in range(len(e12_)) if idx not in extracted_samples_flat_e12])  # Remove extracted samples from e12_\n",
        "print(len(ee12_))  # Print the number of remaining samples in e12_\n",
        "extracted_subset_e12 = torch.utils.data.Subset(ee12_, extracted_samples_flat_e12)\n",
        "e12_extracted_loader = torch.utils.data.DataLoader(extracted_subset_e12, batch_size=100, shuffle=False, num_workers=0)\n",
        "e12_extracted_loader_iter = iter(e12_extracted_loader)\n",
        "e12_extracted_loader_image, e12_extracted_loader_label = next(e12_extracted_loader_iter)\n",
        "################################################################################################################################################\n",
        "# Extract samples from e34_\n",
        "extracted_samples_e34 = {class_idx: [] for class_idx in range(10)}  # Initialize a dictionary to store extracted samples\n",
        "for idx, (image, label) in enumerate(e34_):  # Extract specified number of samples from e34_ dataset\n",
        "    if len(extracted_samples_e34[label]) < 10:\n",
        "        extracted_samples_e34[label].append(idx)\n",
        "    if all(len(samples) == 10 for samples in extracted_samples_e34.values()):  # Check if required number of samples are extracted\n",
        "        break\n",
        "extracted_samples_flat_e34 = [sample_idx for samples in extracted_samples_e34.values() for sample_idx in samples]  # Flatten the list of extracted samples\n",
        "ee34_ = torch.utils.data.Subset(e34_, [idx for idx in range(len(e34_)) if idx not in extracted_samples_flat_e34])  # Remove extracted samples from e34_\n",
        "print(len(ee34_))  # Print the number of remaining samples in e34_\n",
        "extracted_subset_e34 = torch.utils.data.Subset(ee34_, extracted_samples_flat_e34)\n",
        "e34_extracted_loader = torch.utils.data.DataLoader(extracted_subset_e34, batch_size=100, shuffle=False, num_workers=0)\n",
        "e34_extracted_loader_iter = iter(e34_extracted_loader)\n",
        "e34_extracted_loader_image, e34_extracted_loader_label = next(e34_extracted_loader_iter)\n",
        "################################################################################################################################################\n",
        "# Concatenate the remaining samples from e12_ and e34_\n",
        "e1234 = ConcatDataset([ee12_, ee34_])\n",
        "e3412 = ConcatDataset([ee34_, ee12_])\n",
        "e1234_loader = torch.utils.data.DataLoader(e1234, batch_size=40, shuffle=True, num_workers=0)\n",
        "e3412_loader = torch.utils.data.DataLoader(e3412, batch_size=40, shuffle=True, num_workers=0)\n",
        "################################################################################################################################################\n",
        "# Set download to True for the first use to automatically download the dataset\n",
        "s_test_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)\n",
        "s_test_loader = torch.utils.data.DataLoader(s_test_set, batch_size=50000, shuffle=False, num_workers=0)\n",
        "s_test_data_iter = iter(s_test_loader)\n",
        "s_test_image, s_test_label = next(s_test_data_iter)\n",
        "print(s_test_image.shape)  # Print the shape of the test dataset images\n",
        "\n",
        "s_tra_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=False, transform=transform)\n",
        "s_tra_loader = torch.utils.data.DataLoader(s_tra_set, batch_size=10000, shuffle=False, num_workers=0)\n",
        "s_tra_data_iter = iter(s_tra_loader)\n",
        "s_tra_image, s_tra_label = next(s_tra_data_iter)\n",
        "################################################################################################################################################\n",
        "\n",
        "classes = ('plane', 'car', 'bird', 'cat',\n",
        "           'deer', 'dog', 'frog', 'horse', 'ship', 'truck')"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "iaaFKgl16f7L",
        "outputId": "6ac85152-52d6-4d2b-d97c-0825767b28cf"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to ./data/cifar-10-python.tar.gz\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 170498071/170498071 [00:02<00:00, 75016680.91it/s]\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Extracting ./data/cifar-10-python.tar.gz to ./data\n",
            "Files already downloaded and verified\n",
            "50000\n",
            "10000\n",
            "24900\n",
            "24900\n",
            "torch.Size([10000, 3, 32, 32])\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "import random\n",
        "\n",
        "## Sampling ## validation\n",
        "############################ e12_ ###########################\n",
        "class_indices = {class_idx: [] for class_idx in range(10)}  # Initialize dictionary to store class indices\n",
        "for idx, (image, label) in enumerate(ee12_):  # Enumerate through ee12_ dataset\n",
        "    class_indices[label].append(idx)  # Append index to corresponding class\n",
        "sample_indices_12 = []\n",
        "for class_idx, indices in class_indices.items():  # For each class, sample 10 indices\n",
        "    sample_indices_12.extend(random.sample(indices, 10))\n",
        "sample_e12 = torch.utils.data.Subset(ee12_, sample_indices_12)  # Create a subset of ee12_ with sampled indices\n",
        "e12_s_loader = torch.utils.data.DataLoader(sample_e12, batch_size=100, shuffle=False, num_workers=0)  # DataLoader for the sampled subset\n",
        "e12_s_loader_iter = iter(e12_s_loader)  # Create an iterator\n",
        "e12_s_loader_image, e12_s_loader_label = next(e12_s_loader_iter)  # Get a batch of images and labels\n",
        "\n",
        "############################ e34_ ###########################\n",
        "class_indices = {class_idx: [] for class_idx in range(10)}  # Initialize dictionary to store class indices\n",
        "for idx, (image, label) in enumerate(ee34_):  # Enumerate through ee34_ dataset\n",
        "    class_indices[label].append(idx)  # Append index to corresponding class\n",
        "sample_indices_34 = []\n",
        "for class_idx, indices in class_indices.items():  # For each class, sample 10 indices\n",
        "    sample_indices_34.extend(random.sample(indices, 10))\n",
        "sample_e34 = torch.utils.data.Subset(ee34_, sample_indices_34)  # Create a subset of ee34_ with sampled indices\n",
        "e34_s_loader = torch.utils.data.DataLoader(sample_e34, batch_size=100, shuffle=False, num_workers=0)  # DataLoader for the sampled subset\n",
        "e34_s_loader_iter = iter(e34_s_loader)  # Create an iterator\n",
        "e34_s_loader_image, e34_s_loader_label = next(e34_s_loader_iter)  # Get a batch of images and labels"
      ],
      "metadata": {
        "id": "vhu3-AU_6roi"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "cuda = True if torch.cuda.is_available() else False"
      ],
      "metadata": {
        "id": "XnbhhnBk60kC"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "### **Network1 : use only linear layers + Generalization Decision Process (GDP)**"
      ],
      "metadata": {
        "id": "qTmY_XxLqWl-"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import argparse\n",
        "import os\n",
        "import numpy as np\n",
        "import torchvision.transforms as transforms\n",
        "from torchvision.utils import save_image\n",
        "from torch.utils.data import DataLoader\n",
        "from torchvision import datasets\n",
        "from torch.autograd import Variable\n",
        "import torch.nn as nn\n",
        "import torch\n",
        "\n",
        "class LLNet(nn.Module):  # Use only linear layers\n",
        "    def __init__(self):\n",
        "        super(LLNet, self).__init__()\n",
        "\n",
        "        self.fc1 = nn.Linear(3*32*32, 1000)  # First fully connected layer\n",
        "        self.fc2 = nn.Linear(1000, 500)      # Second fully connected layer\n",
        "        self.fc3 = nn.Linear(500, 100)       # Third fully connected layer\n",
        "        self.fc4 = nn.Linear(100, 50)        # Fourth fully connected layer\n",
        "        self.fc5 = nn.Linear(50, 25)         # Fifth fully connected layer\n",
        "        self.fc6 = nn.Linear(25, 20)         # Sixth fully connected layer\n",
        "        self.fc7 = nn.Linear(20, 10)         # Seventh fully connected layer (output layer)\n",
        "\n",
        "    def forward(self, x):\n",
        "        x = x.view(-1, 3*32*32)  # Flatten the input image\n",
        "        x = self.fc1(x)  # Apply first fully connected layer\n",
        "        x = self.fc2(x)  # Apply second fully connected layer\n",
        "        x = self.fc3(x)  # Apply third fully connected layer\n",
        "        x = self.fc4(x)  # Apply fourth fully connected layer\n",
        "        x = self.fc5(x)  # Apply fifth fully connected layer\n",
        "        x = self.fc6(x)  # Apply sixth fully connected layer\n",
        "        x = self.fc7(x)  # Apply seventh fully connected layer (output)\n",
        "        return x\n",
        "\n",
        "loss_function = torch.nn.CrossEntropyLoss()  # Define the loss function\n",
        "net = LLNet()  # Instantiate the network\n",
        "\n",
        "# If a GPU is available, run everything in CUDA mode\n",
        "if torch.cuda.is_available():\n",
        "    net = net.cuda()  # Move the network to GPU\n",
        "    loss_function = loss_function.cuda()  # Move the loss function to GPU\n",
        "\n",
        "optimizer_L = torch.optim.Adam(net.parameters(), lr=0.001)  # Define the optimizer with a learning rate of 0.001"
      ],
      "metadata": {
        "id": "9g4x7gTS60zS"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "from collections import Counter, defaultdict\n",
        "from itertools import combinations\n",
        "import random\n",
        "\n",
        "a_train = []  # To store training accuracy\n",
        "a_test = []  # To store test accuracy\n",
        "lossaaa = []  # To store loss values\n",
        "Inf = []  # To store information values\n",
        "Var_all = []  # To store all variation values\n",
        "Generalization_Ratio_ = []  # To store generalization ratios\n",
        "dicide_action = []  # To store decision actions\n",
        "loss_before = torch.tensor(30.0)  # Initial loss value\n",
        "los = torch.tensor(30.0)  # Initial loss value\n",
        "dis_before_A1 = torch.tensor(0)  # Distance before action A1\n",
        "dis_before_A2 = torch.tensor(0)  # Distance before action A2\n",
        "dis = torch.tensor(1)  # Distance increment\n",
        "per = \"N\"  # Previous iteration's action\n",
        "state_before = torch.tensor(0.0)  # Previous state value\n",
        "categrary_number = 10  # Number of categories\n",
        "tra_val_number = 2  # Training validation number\n",
        "\n",
        "for epoch in range(5):  # Loop over the dataset multiple times\n",
        "    e3412_iter = iter(e3412_loader)  # Iterator for e3412_loader\n",
        "    running_loss = 0.0  # Running loss\n",
        "    running_loss_all = 0.0  # Running loss for all\n",
        "    loss_before = Variable(loss_before, requires_grad=False)  # Make loss_before a variable\n",
        "    los = Variable(los, requires_grad=False)  # Make los a variable\n",
        "    state_before = Variable(state_before, requires_grad=False)  # Make state_before a variable\n",
        "    dis_before_A1 = Variable(dis_before_A1, requires_grad=False)  # Make dis_before_A1 a variable\n",
        "    dis_before_A2 = Variable(dis_before_A2, requires_grad=False)  # Make dis_before_A2 a variable\n",
        "    acc_A1 = Variable(dis_before_A1, requires_grad=False)  # Make acc_A1 a variable\n",
        "    acc_A2 = Variable(dis_before_A2, requires_grad=False)  # Make acc_A2 a variable\n",
        "    dis_ = Variable(dis, requires_grad=False)  # Make dis a variable\n",
        "\n",
        "    for step, (imgs, labels) in enumerate(e1234_loader):  # Iterate over the data\n",
        "        ### calculate losses\n",
        "        weight_val_probility = 1.0 / tra_val_number  # Weight for validation probability\n",
        "        labels = labels.cuda()  # Move labels to GPU\n",
        "        imgs = imgs.cuda()  # Move images to GPU\n",
        "        out_e1234 = net(imgs)  # Get output from the network\n",
        "        loss_out_e1234 = loss_function(out_e1234, labels)  # Calculate loss for e1234 (A1)\n",
        "\n",
        "        e3412_imgs, e3412_labels = next(e3412_iter)  # Get next batch from e3412_iter\n",
        "        e3412_imgs = e3412_imgs.cuda()  # Move e3412 images to GPU\n",
        "        e3412_labels = e3412_labels.cuda()  # Move e3412 labels to GPU\n",
        "        out_e3412 = net(e3412_imgs)  # Get output from the network\n",
        "        loss_out_e3412 = loss_function(out_e3412, e3412_labels)  # Calculate loss for e3412 (A3)\n",
        "\n",
        "        #################### extract\n",
        "        ## e1 ext count\n",
        "        e12_extracted_loader_image = e12_extracted_loader_image.cuda()  # Move e12 extracted images to GPU\n",
        "        e12_extracted_loader_label = e12_extracted_loader_label.cuda()  # Move e12 extracted labels to GPU\n",
        "        e12_extracted_out = net(e12_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e12_extracted = torch.max(e12_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ## e2 ext count\n",
        "        e34_extracted_loader_image = e34_extracted_loader_image.cuda()  # Move e34 extracted images to GPU\n",
        "        e34_extracted_loader_label = e34_extracted_loader_label.cuda()  # Move e34 extracted labels to GPU\n",
        "        e34_extracted_out = net(e34_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e34_extracted = torch.max(e34_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ########### e1 count\n",
        "        e12_s_loader_image = e12_s_loader_image.cuda()  # Move e12 sample images to GPU\n",
        "        e12_s_loader_label = e12_s_loader_label.cuda()  # Move e12 sample labels to GPU\n",
        "        e12_inform_out = net(e12_s_loader_image).detach()  # Get detached output from the network\n",
        "        e12_inform = torch.max(e12_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e12_inform = torch.chunk(e12_inform, 10)  # Split e12 inform into 10 chunks\n",
        "        split_e12_inform = list(split_e12_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e12_inform)):\n",
        "            counts_E12 = torch.bincount(split_e12_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e12 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e12[category] = counts_E12[category]  # Update counts\n",
        "            split_e12_inform[i] = counts_e12  # Store updated counts\n",
        "\n",
        "        ########### e2 count\n",
        "        e34_s_loader_image = e34_s_loader_image.cuda()  # Move e34 sample images to GPU\n",
        "        e34_s_loader_label = e34_s_loader_label.cuda()  # Move e34 sample labels to GPU\n",
        "        e34_inform_out = net(e34_s_loader_image).detach()  # Get detached output from the network\n",
        "        e34_inform = torch.max(e34_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e34_inform = torch.chunk(e34_inform, 10)  # Split e34 inform into 10 chunks\n",
        "        split_e34_inform = list(split_e34_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e34_inform)):\n",
        "            counts_E34 = torch.bincount(split_e34_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e34 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e34[category] = counts_E34[category]  # Update counts\n",
        "            split_e34_inform[i] = counts_e34  # Store updated counts\n",
        "\n",
        "        ##########\n",
        "        ## IN_IN_pro\n",
        "        counts_i_12 = torch.bincount(e12_inform, minlength=10)  # Count occurrences for e12 inform\n",
        "        counts_i_34 = torch.bincount(e34_inform, minlength=10)  # Count occurrences for e34 inform\n",
        "        counts_in_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_in_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_12[category] = counts_i_12[category]  # Update counts for e12\n",
        "        total_samples_in_12 = len(e12_inform)  # Total samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_34[category] = counts_i_34[category]  # Update counts for e34\n",
        "        total_samples_in_34 = len(e34_inform)  # Total samples in e34\n",
        "\n",
        "        min_denominator_in_12 = total_samples_in_12 * 1e-6  # Minimum denominator for e12\n",
        "        probabilities_in_12 = counts_in_12 / (total_samples_in_12 + min_denominator_in_12)  # Probabilities for e12\n",
        "        probabilities_tensor_in_12 = probabilities_in_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12\n",
        "\n",
        "        min_denominator_in_34 = total_samples_in_34 * 1e-6  # Minimum denominator for e34\n",
        "        probabilities_in_34 = counts_in_34 / (total_samples_in_34 + min_denominator_in_34)  # Probabilities for e34\n",
        "        probabilities_tensor_in_34 = probabilities_in_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34\n",
        "\n",
        "        counts_ext_12 = torch.bincount(e12_extracted, minlength=10)  # Count occurrences for e12 extracted\n",
        "        counts_ext_34 = torch.bincount(e34_extracted, minlength=10)  # Count occurrences for e34 extracted\n",
        "        counts_extra_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_extra_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_12[category] = counts_ext_12[category]  # Update counts for e12 extracted\n",
        "        total_extracted_in_12 = len(e12_extracted)  # Total extracted samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_34[category] = counts_ext_34[category]  # Update counts for e34 extracted\n",
        "        total_extracted_in_34 = len(e34_extracted)  # Total extracted samples in e34\n",
        "\n",
        "        min_denominator_ext_12 = total_extracted_in_12 * 1e-6  # Minimum denominator for e12 extracted\n",
        "        probabilities_ext_12 = counts_extra_12 / (total_extracted_in_12 + min_denominator_ext_12)  # Probabilities for e12 extracted\n",
        "        probabilities_tensor_extra_12 = probabilities_ext_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12 extracted\n",
        "\n",
        "        min_denominator_ext_34 = total_extracted_in_34 * 1e-6  # Minimum denominator for e34 extracted\n",
        "        probabilities_ext_34 = counts_extra_34 / (total_extracted_in_34 + min_denominator_ext_34)  # Probabilities for e34 extracted\n",
        "        probabilities_tensor_extra_34 = probabilities_ext_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34 extracted\n",
        "\n",
        "        ############################### Variation x ###################################\n",
        "        in_12_all = probabilities_tensor_in_12\n",
        "        in_34_all = probabilities_tensor_in_34\n",
        "        in_12_extra = probabilities_tensor_extra_12\n",
        "        in_34_extra = probabilities_tensor_extra_34\n",
        "        weight_tra_probility_all = 1.0 / 2\n",
        "        dow_all = \\\n",
        "              (in_12_all*weight_tra_probility_all + in_34_all*weight_tra_probility_all +\n",
        "              in_12_extra*weight_tra_probility_all + in_34_extra*weight_tra_probility_all + 1e-30)\n",
        "        in_1_all = (in_12_all*weight_tra_probility_all) / dow_all\n",
        "        in_2_all = (in_34_all*weight_tra_probility_all) / dow_all\n",
        "        e_1_all = (in_12_extra*weight_tra_probility_all) / dow_all\n",
        "        e_2_all = (in_34_extra*weight_tra_probility_all) / dow_all\n",
        "        in_1_all = in_1_all[0]\n",
        "        in_2_all = in_2_all[0]\n",
        "        e_1_all = e_1_all[0]\n",
        "        e_2_all = e_2_all[0]\n",
        "        d_KL_all = torch.zeros(10)\n",
        "        k_divergence_all = (in_1_all + 1e-30) * torch.log(in_1_all / (e_1_all + 1e-30) + 1e-30)\n",
        "        k_divergence_all_ = (in_1_all + 1e-30) * torch.log(in_1_all / (e_2_all + 1e-30) + 1e-30)\n",
        "        d_KL_all = torch.max(abs(k_divergence_all))\n",
        "        d_KL_all_ = torch.max(abs(k_divergence_all_))\n",
        "        Variation_all = torch.max(d_KL_all, d_KL_all_)\n",
        "        Var_all.append(Variation_all)\n",
        "\n",
        "        ############################ Information ###################################\n",
        "        all_combinations = list(combinations(range(10), 2))\n",
        "        K = categrary_number * (categrary_number - 1)\n",
        "        result_tensor = torch.zeros(len(all_combinations) * 2)  # Calculate the difference of each pair of combinations and store in result tensor\n",
        "        for c in range(10):\n",
        "            for idx, (i, j) in enumerate(all_combinations):\n",
        "                s1 = abs(((split_e12_inform[c][i]/10) + 1e-30) * torch.log((split_e12_inform[c][i]/10) / ((split_e12_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                s3 = abs(((split_e34_inform[c][i]/10) + 1e-30) * torch.log((split_e34_inform[c][i]/10) / ((split_e34_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                min_value = torch.min(s1, s3)\n",
        "                result_tensor[idx] = min_value.item()\n",
        "                idx_ = idx + len(all_combinations)\n",
        "                s1_ = abs(((split_e12_inform[c][j]/10) + 1e-30) * torch.log((split_e12_inform[c][j]/10) / ((split_e12_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                s3_ = abs(((split_e34_inform[c][j]/10) + 1e-30) * torch.log((split_e34_inform[c][j]/10) / ((split_e34_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                min_value_ = torch.min(s1_, s3_)\n",
        "                result_tensor[idx_] = min_value_.item()\n",
        "        Information = torch.sum(result_tensor) / K\n",
        "        Inf.append(Information)\n",
        "\n",
        "        ############################ Generalization_Ratio ###################################\n",
        "        Generalization_Ratio = Variation_all * (Information + 1.0) / Information\n",
        "        Generalization_Ratio_.append(Generalization_Ratio)\n",
        "\n",
        "        ############################ Generalization Decision Process (GDP) ###################################\n",
        "        state_now = Generalization_Ratio\n",
        "        loss_before = loss_before.cuda()\n",
        "        state_before = state_before.cuda()\n",
        "        state_dis = state_now - state_before\n",
        "        result_tensor = torch.cat((loss_out_e1234.unsqueeze(0), loss_out_e3412.unsqueeze(0)), 0)\n",
        "\n",
        "        # Because two datasets loss_out_e1234 and loss_out_e3412 are used, and there are actions A1 and A2,\n",
        "        # choose one based on the reward\n",
        "        if state_dis >= 0.0:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "        else:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "\n",
        "        ####################################\n",
        "        #### optimizer\n",
        "        los = loss - loss_before\n",
        "        state_before = state_now\n",
        "        optimizer_L.zero_grad()\n",
        "        loss.backward()\n",
        "        optimizer_L.step()\n",
        "        loss_before = loss\n",
        "        running_loss += loss.item()\n",
        "\n",
        "        # Print statistics\n",
        "        if step % 5 == 4:  # Print every 500 mini-batches\n",
        "            with torch.no_grad():  # 'with' is a context manager\n",
        "                s_test_image = s_test_image.cuda()\n",
        "                s_test_label = s_test_label.cuda()\n",
        "                s_tra_image = s_tra_image.cuda()\n",
        "                s_tra_label = s_tra_label.cuda()\n",
        "                outputs = net(s_test_image)  # [batch, 10]\n",
        "                predict_y = torch.max(outputs, dim=1)[1]\n",
        "                accuracy = torch.eq(predict_y, s_test_label).sum().item() / s_test_label.size(0)\n",
        "                a_test.append(float(accuracy))\n",
        "                outputs_t = net(s_tra_image)  # [batch, 10]\n",
        "                predict_y_t = torch.max(outputs_t, dim=1)[1]\n",
        "                accuracy_t = torch.eq(predict_y_t, s_tra_label).sum().item() / s_tra_label.size(0)\n",
        "                a_train.append(float(accuracy_t))\n",
        "                lossaaa.append(float(running_loss / 5))\n",
        "                print('[%d, %5d] train_loss: %.3f train_accuracy: %.3f test_accuracy: %.3f' %\n",
        "                      (epoch + 1, step + 1, running_loss / 5, accuracy_t, accuracy))\n",
        "                running_loss = 0.0\n",
        "                running_loss = 0.0"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "_xyJjELa7Bql",
        "outputId": "70e7bdd6-2d5a-4ea8-c797-88b4f4864513"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "[1,     5] train_loss: 2.287 train_accuracy: 0.204 test_accuracy: 0.205\n",
            "[1,    10] train_loss: 2.102 train_accuracy: 0.216 test_accuracy: 0.217\n",
            "[1,    15] train_loss: 2.142 train_accuracy: 0.214 test_accuracy: 0.207\n",
            "[1,    20] train_loss: 2.094 train_accuracy: 0.242 test_accuracy: 0.237\n",
            "[1,    25] train_loss: 2.087 train_accuracy: 0.259 test_accuracy: 0.268\n",
            "[1,    30] train_loss: 1.935 train_accuracy: 0.273 test_accuracy: 0.269\n",
            "[1,    35] train_loss: 2.063 train_accuracy: 0.274 test_accuracy: 0.272\n",
            "[1,    40] train_loss: 2.122 train_accuracy: 0.276 test_accuracy: 0.272\n",
            "[1,    45] train_loss: 1.929 train_accuracy: 0.267 test_accuracy: 0.256\n",
            "[1,    50] train_loss: 1.958 train_accuracy: 0.288 test_accuracy: 0.282\n",
            "[1,    55] train_loss: 1.889 train_accuracy: 0.270 test_accuracy: 0.266\n",
            "[1,    60] train_loss: 2.039 train_accuracy: 0.285 test_accuracy: 0.279\n",
            "[1,    65] train_loss: 1.980 train_accuracy: 0.308 test_accuracy: 0.309\n",
            "[1,    70] train_loss: 2.049 train_accuracy: 0.293 test_accuracy: 0.291\n",
            "[1,    75] train_loss: 2.008 train_accuracy: 0.299 test_accuracy: 0.298\n",
            "[1,    80] train_loss: 2.029 train_accuracy: 0.290 test_accuracy: 0.286\n",
            "[1,    85] train_loss: 2.092 train_accuracy: 0.255 test_accuracy: 0.264\n",
            "[1,    90] train_loss: 1.976 train_accuracy: 0.260 test_accuracy: 0.265\n",
            "[1,    95] train_loss: 1.972 train_accuracy: 0.268 test_accuracy: 0.276\n",
            "[1,   100] train_loss: 2.041 train_accuracy: 0.296 test_accuracy: 0.302\n",
            "[1,   105] train_loss: 1.900 train_accuracy: 0.282 test_accuracy: 0.287\n",
            "[1,   110] train_loss: 2.069 train_accuracy: 0.271 test_accuracy: 0.263\n",
            "[1,   115] train_loss: 1.911 train_accuracy: 0.277 test_accuracy: 0.278\n",
            "[1,   120] train_loss: 1.935 train_accuracy: 0.285 test_accuracy: 0.290\n",
            "[1,   125] train_loss: 2.019 train_accuracy: 0.294 test_accuracy: 0.290\n",
            "[1,   130] train_loss: 1.879 train_accuracy: 0.262 test_accuracy: 0.261\n",
            "[1,   135] train_loss: 2.041 train_accuracy: 0.254 test_accuracy: 0.257\n",
            "[1,   140] train_loss: 1.915 train_accuracy: 0.308 test_accuracy: 0.311\n",
            "[1,   145] train_loss: 2.109 train_accuracy: 0.272 test_accuracy: 0.271\n",
            "[1,   150] train_loss: 1.981 train_accuracy: 0.301 test_accuracy: 0.296\n",
            "[1,   155] train_loss: 1.918 train_accuracy: 0.302 test_accuracy: 0.295\n",
            "[1,   160] train_loss: 1.996 train_accuracy: 0.311 test_accuracy: 0.306\n",
            "[1,   165] train_loss: 1.940 train_accuracy: 0.291 test_accuracy: 0.292\n",
            "[1,   170] train_loss: 1.906 train_accuracy: 0.294 test_accuracy: 0.293\n",
            "[1,   175] train_loss: 1.928 train_accuracy: 0.316 test_accuracy: 0.313\n",
            "[1,   180] train_loss: 1.888 train_accuracy: 0.311 test_accuracy: 0.313\n",
            "[1,   185] train_loss: 2.000 train_accuracy: 0.313 test_accuracy: 0.313\n",
            "[1,   190] train_loss: 1.840 train_accuracy: 0.318 test_accuracy: 0.320\n",
            "[1,   195] train_loss: 1.884 train_accuracy: 0.325 test_accuracy: 0.323\n",
            "[1,   200] train_loss: 1.870 train_accuracy: 0.317 test_accuracy: 0.318\n",
            "[1,   205] train_loss: 1.925 train_accuracy: 0.334 test_accuracy: 0.328\n",
            "[1,   210] train_loss: 1.852 train_accuracy: 0.311 test_accuracy: 0.315\n",
            "[1,   215] train_loss: 2.045 train_accuracy: 0.315 test_accuracy: 0.310\n",
            "[1,   220] train_loss: 1.951 train_accuracy: 0.325 test_accuracy: 0.319\n",
            "[1,   225] train_loss: 2.061 train_accuracy: 0.304 test_accuracy: 0.296\n",
            "[1,   230] train_loss: 2.004 train_accuracy: 0.305 test_accuracy: 0.300\n",
            "[1,   235] train_loss: 1.970 train_accuracy: 0.319 test_accuracy: 0.306\n",
            "[1,   240] train_loss: 2.005 train_accuracy: 0.319 test_accuracy: 0.317\n",
            "[1,   245] train_loss: 1.923 train_accuracy: 0.293 test_accuracy: 0.290\n",
            "[1,   250] train_loss: 1.860 train_accuracy: 0.324 test_accuracy: 0.325\n",
            "[1,   255] train_loss: 1.957 train_accuracy: 0.329 test_accuracy: 0.327\n",
            "[1,   260] train_loss: 1.910 train_accuracy: 0.308 test_accuracy: 0.312\n",
            "[1,   265] train_loss: 1.932 train_accuracy: 0.309 test_accuracy: 0.308\n",
            "[1,   270] train_loss: 1.835 train_accuracy: 0.315 test_accuracy: 0.316\n",
            "[1,   275] train_loss: 1.905 train_accuracy: 0.312 test_accuracy: 0.315\n",
            "[1,   280] train_loss: 1.831 train_accuracy: 0.306 test_accuracy: 0.302\n",
            "[1,   285] train_loss: 1.878 train_accuracy: 0.327 test_accuracy: 0.321\n",
            "[1,   290] train_loss: 1.914 train_accuracy: 0.323 test_accuracy: 0.317\n",
            "[1,   295] train_loss: 2.003 train_accuracy: 0.332 test_accuracy: 0.322\n",
            "[1,   300] train_loss: 1.928 train_accuracy: 0.321 test_accuracy: 0.307\n",
            "[1,   305] train_loss: 1.831 train_accuracy: 0.328 test_accuracy: 0.323\n",
            "[1,   310] train_loss: 1.846 train_accuracy: 0.311 test_accuracy: 0.308\n",
            "[1,   315] train_loss: 1.982 train_accuracy: 0.322 test_accuracy: 0.321\n",
            "[1,   320] train_loss: 1.816 train_accuracy: 0.328 test_accuracy: 0.325\n",
            "[1,   325] train_loss: 1.889 train_accuracy: 0.329 test_accuracy: 0.326\n",
            "[1,   330] train_loss: 1.752 train_accuracy: 0.341 test_accuracy: 0.336\n",
            "[1,   335] train_loss: 1.934 train_accuracy: 0.338 test_accuracy: 0.333\n",
            "[1,   340] train_loss: 1.872 train_accuracy: 0.322 test_accuracy: 0.314\n",
            "[1,   345] train_loss: 1.829 train_accuracy: 0.334 test_accuracy: 0.327\n",
            "[1,   350] train_loss: 1.904 train_accuracy: 0.323 test_accuracy: 0.316\n",
            "[1,   355] train_loss: 1.982 train_accuracy: 0.334 test_accuracy: 0.334\n",
            "[1,   360] train_loss: 1.884 train_accuracy: 0.311 test_accuracy: 0.312\n",
            "[1,   365] train_loss: 2.037 train_accuracy: 0.336 test_accuracy: 0.329\n",
            "[1,   370] train_loss: 1.896 train_accuracy: 0.336 test_accuracy: 0.333\n",
            "[1,   375] train_loss: 1.936 train_accuracy: 0.337 test_accuracy: 0.328\n",
            "[1,   380] train_loss: 1.968 train_accuracy: 0.317 test_accuracy: 0.303\n",
            "[1,   385] train_loss: 1.908 train_accuracy: 0.338 test_accuracy: 0.339\n",
            "[1,   390] train_loss: 1.926 train_accuracy: 0.341 test_accuracy: 0.340\n",
            "[1,   395] train_loss: 1.814 train_accuracy: 0.314 test_accuracy: 0.306\n",
            "[1,   400] train_loss: 1.902 train_accuracy: 0.339 test_accuracy: 0.333\n",
            "[1,   405] train_loss: 1.924 train_accuracy: 0.329 test_accuracy: 0.326\n",
            "[1,   410] train_loss: 1.864 train_accuracy: 0.328 test_accuracy: 0.320\n",
            "[1,   415] train_loss: 1.856 train_accuracy: 0.336 test_accuracy: 0.339\n",
            "[1,   420] train_loss: 2.050 train_accuracy: 0.326 test_accuracy: 0.333\n",
            "[1,   425] train_loss: 1.922 train_accuracy: 0.328 test_accuracy: 0.324\n",
            "[1,   430] train_loss: 1.935 train_accuracy: 0.340 test_accuracy: 0.330\n",
            "[1,   435] train_loss: 1.843 train_accuracy: 0.355 test_accuracy: 0.350\n",
            "[1,   440] train_loss: 1.882 train_accuracy: 0.322 test_accuracy: 0.324\n",
            "[1,   445] train_loss: 1.836 train_accuracy: 0.348 test_accuracy: 0.346\n",
            "[1,   450] train_loss: 1.787 train_accuracy: 0.344 test_accuracy: 0.337\n",
            "[1,   455] train_loss: 1.953 train_accuracy: 0.335 test_accuracy: 0.332\n",
            "[1,   460] train_loss: 1.914 train_accuracy: 0.347 test_accuracy: 0.345\n",
            "[1,   465] train_loss: 1.867 train_accuracy: 0.343 test_accuracy: 0.339\n",
            "[1,   470] train_loss: 1.828 train_accuracy: 0.351 test_accuracy: 0.349\n",
            "[1,   475] train_loss: 1.891 train_accuracy: 0.345 test_accuracy: 0.343\n",
            "[1,   480] train_loss: 1.857 train_accuracy: 0.341 test_accuracy: 0.334\n",
            "[1,   485] train_loss: 1.795 train_accuracy: 0.363 test_accuracy: 0.342\n",
            "[1,   490] train_loss: 1.801 train_accuracy: 0.342 test_accuracy: 0.332\n",
            "[1,   495] train_loss: 1.931 train_accuracy: 0.354 test_accuracy: 0.347\n",
            "[1,   500] train_loss: 1.778 train_accuracy: 0.341 test_accuracy: 0.330\n",
            "[1,   505] train_loss: 1.877 train_accuracy: 0.311 test_accuracy: 0.302\n",
            "[1,   510] train_loss: 1.735 train_accuracy: 0.328 test_accuracy: 0.328\n",
            "[1,   515] train_loss: 1.944 train_accuracy: 0.325 test_accuracy: 0.320\n",
            "[1,   520] train_loss: 1.855 train_accuracy: 0.327 test_accuracy: 0.309\n",
            "[1,   525] train_loss: 1.939 train_accuracy: 0.339 test_accuracy: 0.327\n",
            "[1,   530] train_loss: 1.972 train_accuracy: 0.335 test_accuracy: 0.331\n",
            "[1,   535] train_loss: 2.080 train_accuracy: 0.319 test_accuracy: 0.321\n",
            "[1,   540] train_loss: 1.849 train_accuracy: 0.323 test_accuracy: 0.309\n",
            "[1,   545] train_loss: 1.960 train_accuracy: 0.347 test_accuracy: 0.333\n",
            "[1,   550] train_loss: 1.812 train_accuracy: 0.337 test_accuracy: 0.333\n",
            "[1,   555] train_loss: 1.876 train_accuracy: 0.315 test_accuracy: 0.313\n",
            "[1,   560] train_loss: 1.900 train_accuracy: 0.343 test_accuracy: 0.329\n",
            "[1,   565] train_loss: 1.836 train_accuracy: 0.329 test_accuracy: 0.324\n",
            "[1,   570] train_loss: 1.752 train_accuracy: 0.316 test_accuracy: 0.311\n",
            "[1,   575] train_loss: 1.935 train_accuracy: 0.347 test_accuracy: 0.344\n",
            "[1,   580] train_loss: 1.854 train_accuracy: 0.344 test_accuracy: 0.338\n",
            "[1,   585] train_loss: 1.879 train_accuracy: 0.350 test_accuracy: 0.341\n",
            "[1,   590] train_loss: 1.749 train_accuracy: 0.336 test_accuracy: 0.326\n",
            "[1,   595] train_loss: 1.811 train_accuracy: 0.356 test_accuracy: 0.348\n",
            "[1,   600] train_loss: 1.808 train_accuracy: 0.339 test_accuracy: 0.337\n",
            "[1,   605] train_loss: 1.773 train_accuracy: 0.356 test_accuracy: 0.354\n",
            "[1,   610] train_loss: 1.777 train_accuracy: 0.357 test_accuracy: 0.353\n",
            "[1,   615] train_loss: 1.844 train_accuracy: 0.340 test_accuracy: 0.330\n",
            "[1,   620] train_loss: 2.012 train_accuracy: 0.346 test_accuracy: 0.329\n",
            "[1,   625] train_loss: 1.911 train_accuracy: 0.357 test_accuracy: 0.349\n",
            "[1,   630] train_loss: 1.911 train_accuracy: 0.355 test_accuracy: 0.344\n",
            "[1,   635] train_loss: 1.917 train_accuracy: 0.348 test_accuracy: 0.344\n",
            "[1,   640] train_loss: 1.763 train_accuracy: 0.357 test_accuracy: 0.347\n",
            "[1,   645] train_loss: 1.804 train_accuracy: 0.332 test_accuracy: 0.322\n",
            "[1,   650] train_loss: 1.835 train_accuracy: 0.354 test_accuracy: 0.351\n",
            "[1,   655] train_loss: 1.841 train_accuracy: 0.323 test_accuracy: 0.320\n",
            "[1,   660] train_loss: 1.953 train_accuracy: 0.362 test_accuracy: 0.355\n",
            "[1,   665] train_loss: 1.791 train_accuracy: 0.356 test_accuracy: 0.347\n",
            "[1,   670] train_loss: 1.765 train_accuracy: 0.350 test_accuracy: 0.337\n",
            "[1,   675] train_loss: 1.907 train_accuracy: 0.344 test_accuracy: 0.330\n",
            "[1,   680] train_loss: 1.945 train_accuracy: 0.335 test_accuracy: 0.334\n",
            "[1,   685] train_loss: 1.897 train_accuracy: 0.342 test_accuracy: 0.335\n",
            "[1,   690] train_loss: 1.861 train_accuracy: 0.354 test_accuracy: 0.344\n",
            "[1,   695] train_loss: 1.892 train_accuracy: 0.366 test_accuracy: 0.357\n",
            "[1,   700] train_loss: 1.874 train_accuracy: 0.362 test_accuracy: 0.354\n",
            "[1,   705] train_loss: 1.770 train_accuracy: 0.363 test_accuracy: 0.359\n",
            "[1,   710] train_loss: 1.848 train_accuracy: 0.353 test_accuracy: 0.350\n",
            "[1,   715] train_loss: 1.835 train_accuracy: 0.366 test_accuracy: 0.354\n",
            "[1,   720] train_loss: 1.732 train_accuracy: 0.344 test_accuracy: 0.345\n",
            "[1,   725] train_loss: 1.757 train_accuracy: 0.340 test_accuracy: 0.341\n",
            "[1,   730] train_loss: 1.844 train_accuracy: 0.350 test_accuracy: 0.348\n",
            "[1,   735] train_loss: 1.770 train_accuracy: 0.350 test_accuracy: 0.344\n",
            "[1,   740] train_loss: 1.896 train_accuracy: 0.363 test_accuracy: 0.355\n",
            "[1,   745] train_loss: 1.735 train_accuracy: 0.343 test_accuracy: 0.337\n",
            "[1,   750] train_loss: 1.910 train_accuracy: 0.359 test_accuracy: 0.347\n",
            "[1,   755] train_loss: 1.831 train_accuracy: 0.335 test_accuracy: 0.326\n",
            "[1,   760] train_loss: 1.922 train_accuracy: 0.336 test_accuracy: 0.330\n",
            "[1,   765] train_loss: 1.820 train_accuracy: 0.342 test_accuracy: 0.340\n",
            "[1,   770] train_loss: 1.832 train_accuracy: 0.334 test_accuracy: 0.332\n",
            "[1,   775] train_loss: 1.909 train_accuracy: 0.340 test_accuracy: 0.323\n",
            "[1,   780] train_loss: 1.937 train_accuracy: 0.361 test_accuracy: 0.348\n",
            "[1,   785] train_loss: 1.820 train_accuracy: 0.357 test_accuracy: 0.352\n",
            "[1,   790] train_loss: 1.822 train_accuracy: 0.363 test_accuracy: 0.358\n",
            "[1,   795] train_loss: 1.852 train_accuracy: 0.368 test_accuracy: 0.356\n",
            "[1,   800] train_loss: 1.757 train_accuracy: 0.358 test_accuracy: 0.354\n",
            "[1,   805] train_loss: 1.776 train_accuracy: 0.356 test_accuracy: 0.350\n",
            "[1,   810] train_loss: 1.855 train_accuracy: 0.338 test_accuracy: 0.329\n",
            "[1,   815] train_loss: 1.917 train_accuracy: 0.338 test_accuracy: 0.327\n",
            "[1,   820] train_loss: 1.929 train_accuracy: 0.345 test_accuracy: 0.330\n",
            "[1,   825] train_loss: 1.838 train_accuracy: 0.363 test_accuracy: 0.353\n",
            "[1,   830] train_loss: 1.828 train_accuracy: 0.362 test_accuracy: 0.364\n",
            "[1,   835] train_loss: 1.860 train_accuracy: 0.353 test_accuracy: 0.349\n",
            "[1,   840] train_loss: 1.806 train_accuracy: 0.350 test_accuracy: 0.337\n",
            "[1,   845] train_loss: 1.809 train_accuracy: 0.342 test_accuracy: 0.334\n",
            "[1,   850] train_loss: 1.915 train_accuracy: 0.364 test_accuracy: 0.350\n",
            "[1,   855] train_loss: 1.942 train_accuracy: 0.359 test_accuracy: 0.343\n",
            "[1,   860] train_loss: 1.766 train_accuracy: 0.365 test_accuracy: 0.344\n",
            "[1,   865] train_loss: 1.843 train_accuracy: 0.366 test_accuracy: 0.349\n",
            "[1,   870] train_loss: 1.671 train_accuracy: 0.357 test_accuracy: 0.342\n",
            "[1,   875] train_loss: 1.800 train_accuracy: 0.334 test_accuracy: 0.334\n",
            "[1,   880] train_loss: 1.801 train_accuracy: 0.346 test_accuracy: 0.341\n",
            "[1,   885] train_loss: 1.875 train_accuracy: 0.343 test_accuracy: 0.335\n",
            "[1,   890] train_loss: 1.835 train_accuracy: 0.348 test_accuracy: 0.336\n",
            "[1,   895] train_loss: 1.944 train_accuracy: 0.360 test_accuracy: 0.348\n",
            "[1,   900] train_loss: 1.799 train_accuracy: 0.354 test_accuracy: 0.344\n",
            "[1,   905] train_loss: 1.832 train_accuracy: 0.358 test_accuracy: 0.345\n",
            "[1,   910] train_loss: 1.840 train_accuracy: 0.351 test_accuracy: 0.348\n",
            "[1,   915] train_loss: 1.877 train_accuracy: 0.347 test_accuracy: 0.338\n",
            "[1,   920] train_loss: 1.763 train_accuracy: 0.338 test_accuracy: 0.329\n",
            "[1,   925] train_loss: 1.888 train_accuracy: 0.369 test_accuracy: 0.356\n",
            "[1,   930] train_loss: 1.895 train_accuracy: 0.369 test_accuracy: 0.358\n",
            "[1,   935] train_loss: 1.797 train_accuracy: 0.369 test_accuracy: 0.357\n",
            "[1,   940] train_loss: 1.806 train_accuracy: 0.359 test_accuracy: 0.348\n",
            "[1,   945] train_loss: 1.894 train_accuracy: 0.362 test_accuracy: 0.351\n",
            "[1,   950] train_loss: 1.756 train_accuracy: 0.354 test_accuracy: 0.347\n",
            "[1,   955] train_loss: 1.788 train_accuracy: 0.362 test_accuracy: 0.357\n",
            "[1,   960] train_loss: 1.814 train_accuracy: 0.355 test_accuracy: 0.350\n",
            "[1,   965] train_loss: 1.909 train_accuracy: 0.354 test_accuracy: 0.351\n",
            "[1,   970] train_loss: 1.796 train_accuracy: 0.360 test_accuracy: 0.349\n",
            "[1,   975] train_loss: 1.735 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[1,   980] train_loss: 1.821 train_accuracy: 0.350 test_accuracy: 0.348\n",
            "[1,   985] train_loss: 1.796 train_accuracy: 0.360 test_accuracy: 0.358\n",
            "[1,   990] train_loss: 1.857 train_accuracy: 0.363 test_accuracy: 0.357\n",
            "[1,   995] train_loss: 1.677 train_accuracy: 0.358 test_accuracy: 0.357\n",
            "[1,  1000] train_loss: 1.739 train_accuracy: 0.357 test_accuracy: 0.355\n",
            "[1,  1005] train_loss: 1.771 train_accuracy: 0.362 test_accuracy: 0.350\n",
            "[1,  1010] train_loss: 1.849 train_accuracy: 0.347 test_accuracy: 0.336\n",
            "[1,  1015] train_loss: 1.884 train_accuracy: 0.353 test_accuracy: 0.342\n",
            "[1,  1020] train_loss: 1.818 train_accuracy: 0.344 test_accuracy: 0.338\n",
            "[1,  1025] train_loss: 1.797 train_accuracy: 0.356 test_accuracy: 0.345\n",
            "[1,  1030] train_loss: 1.965 train_accuracy: 0.374 test_accuracy: 0.361\n",
            "[1,  1035] train_loss: 1.854 train_accuracy: 0.348 test_accuracy: 0.338\n",
            "[1,  1040] train_loss: 1.743 train_accuracy: 0.358 test_accuracy: 0.348\n",
            "[1,  1045] train_loss: 1.868 train_accuracy: 0.370 test_accuracy: 0.356\n",
            "[1,  1050] train_loss: 1.819 train_accuracy: 0.366 test_accuracy: 0.353\n",
            "[1,  1055] train_loss: 1.854 train_accuracy: 0.351 test_accuracy: 0.344\n",
            "[1,  1060] train_loss: 1.934 train_accuracy: 0.329 test_accuracy: 0.325\n",
            "[1,  1065] train_loss: 1.743 train_accuracy: 0.362 test_accuracy: 0.356\n",
            "[1,  1070] train_loss: 1.720 train_accuracy: 0.369 test_accuracy: 0.360\n",
            "[1,  1075] train_loss: 1.925 train_accuracy: 0.370 test_accuracy: 0.360\n",
            "[1,  1080] train_loss: 1.845 train_accuracy: 0.357 test_accuracy: 0.356\n",
            "[1,  1085] train_loss: 1.822 train_accuracy: 0.365 test_accuracy: 0.360\n",
            "[1,  1090] train_loss: 1.828 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[1,  1095] train_loss: 1.880 train_accuracy: 0.371 test_accuracy: 0.363\n",
            "[1,  1100] train_loss: 1.808 train_accuracy: 0.368 test_accuracy: 0.368\n",
            "[1,  1105] train_loss: 1.907 train_accuracy: 0.370 test_accuracy: 0.365\n",
            "[1,  1110] train_loss: 1.768 train_accuracy: 0.369 test_accuracy: 0.372\n",
            "[1,  1115] train_loss: 1.828 train_accuracy: 0.362 test_accuracy: 0.363\n",
            "[1,  1120] train_loss: 1.808 train_accuracy: 0.350 test_accuracy: 0.350\n",
            "[1,  1125] train_loss: 1.920 train_accuracy: 0.369 test_accuracy: 0.362\n",
            "[1,  1130] train_loss: 1.686 train_accuracy: 0.357 test_accuracy: 0.349\n",
            "[1,  1135] train_loss: 1.750 train_accuracy: 0.359 test_accuracy: 0.353\n",
            "[1,  1140] train_loss: 1.857 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[1,  1145] train_loss: 1.828 train_accuracy: 0.378 test_accuracy: 0.369\n",
            "[1,  1150] train_loss: 1.882 train_accuracy: 0.359 test_accuracy: 0.351\n",
            "[1,  1155] train_loss: 1.739 train_accuracy: 0.359 test_accuracy: 0.355\n",
            "[1,  1160] train_loss: 1.875 train_accuracy: 0.368 test_accuracy: 0.367\n",
            "[1,  1165] train_loss: 1.830 train_accuracy: 0.370 test_accuracy: 0.361\n",
            "[1,  1170] train_loss: 1.893 train_accuracy: 0.368 test_accuracy: 0.366\n",
            "[1,  1175] train_loss: 1.828 train_accuracy: 0.383 test_accuracy: 0.372\n",
            "[1,  1180] train_loss: 1.873 train_accuracy: 0.376 test_accuracy: 0.362\n",
            "[1,  1185] train_loss: 1.737 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[1,  1190] train_loss: 1.818 train_accuracy: 0.369 test_accuracy: 0.359\n",
            "[1,  1195] train_loss: 1.811 train_accuracy: 0.374 test_accuracy: 0.364\n",
            "[1,  1200] train_loss: 1.797 train_accuracy: 0.373 test_accuracy: 0.364\n",
            "[1,  1205] train_loss: 1.798 train_accuracy: 0.369 test_accuracy: 0.360\n",
            "[1,  1210] train_loss: 1.852 train_accuracy: 0.360 test_accuracy: 0.361\n",
            "[1,  1215] train_loss: 1.823 train_accuracy: 0.369 test_accuracy: 0.370\n",
            "[1,  1220] train_loss: 1.800 train_accuracy: 0.371 test_accuracy: 0.368\n",
            "[1,  1225] train_loss: 1.723 train_accuracy: 0.373 test_accuracy: 0.369\n",
            "[1,  1230] train_loss: 1.924 train_accuracy: 0.365 test_accuracy: 0.359\n",
            "[1,  1235] train_loss: 1.899 train_accuracy: 0.354 test_accuracy: 0.348\n",
            "[1,  1240] train_loss: 1.883 train_accuracy: 0.373 test_accuracy: 0.365\n",
            "[1,  1245] train_loss: 1.900 train_accuracy: 0.384 test_accuracy: 0.371\n",
            "[2,     5] train_loss: 1.768 train_accuracy: 0.370 test_accuracy: 0.358\n",
            "[2,    10] train_loss: 1.686 train_accuracy: 0.369 test_accuracy: 0.361\n",
            "[2,    15] train_loss: 1.737 train_accuracy: 0.370 test_accuracy: 0.366\n",
            "[2,    20] train_loss: 1.750 train_accuracy: 0.369 test_accuracy: 0.359\n",
            "[2,    25] train_loss: 1.887 train_accuracy: 0.372 test_accuracy: 0.358\n",
            "[2,    30] train_loss: 1.660 train_accuracy: 0.371 test_accuracy: 0.355\n",
            "[2,    35] train_loss: 1.845 train_accuracy: 0.374 test_accuracy: 0.364\n",
            "[2,    40] train_loss: 1.760 train_accuracy: 0.364 test_accuracy: 0.363\n",
            "[2,    45] train_loss: 1.849 train_accuracy: 0.372 test_accuracy: 0.365\n",
            "[2,    50] train_loss: 1.846 train_accuracy: 0.391 test_accuracy: 0.368\n",
            "[2,    55] train_loss: 1.842 train_accuracy: 0.377 test_accuracy: 0.358\n",
            "[2,    60] train_loss: 1.798 train_accuracy: 0.360 test_accuracy: 0.347\n",
            "[2,    65] train_loss: 1.849 train_accuracy: 0.354 test_accuracy: 0.348\n",
            "[2,    70] train_loss: 1.759 train_accuracy: 0.359 test_accuracy: 0.354\n",
            "[2,    75] train_loss: 1.801 train_accuracy: 0.373 test_accuracy: 0.366\n",
            "[2,    80] train_loss: 1.832 train_accuracy: 0.371 test_accuracy: 0.360\n",
            "[2,    85] train_loss: 1.774 train_accuracy: 0.376 test_accuracy: 0.367\n",
            "[2,    90] train_loss: 1.771 train_accuracy: 0.360 test_accuracy: 0.351\n",
            "[2,    95] train_loss: 1.816 train_accuracy: 0.365 test_accuracy: 0.357\n",
            "[2,   100] train_loss: 1.734 train_accuracy: 0.372 test_accuracy: 0.367\n",
            "[2,   105] train_loss: 1.732 train_accuracy: 0.372 test_accuracy: 0.363\n",
            "[2,   110] train_loss: 1.708 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[2,   115] train_loss: 1.893 train_accuracy: 0.359 test_accuracy: 0.349\n",
            "[2,   120] train_loss: 1.837 train_accuracy: 0.360 test_accuracy: 0.351\n",
            "[2,   125] train_loss: 1.897 train_accuracy: 0.368 test_accuracy: 0.360\n",
            "[2,   130] train_loss: 1.831 train_accuracy: 0.348 test_accuracy: 0.346\n",
            "[2,   135] train_loss: 1.778 train_accuracy: 0.360 test_accuracy: 0.354\n",
            "[2,   140] train_loss: 1.758 train_accuracy: 0.358 test_accuracy: 0.353\n",
            "[2,   145] train_loss: 1.777 train_accuracy: 0.364 test_accuracy: 0.350\n",
            "[2,   150] train_loss: 1.768 train_accuracy: 0.375 test_accuracy: 0.365\n",
            "[2,   155] train_loss: 1.748 train_accuracy: 0.367 test_accuracy: 0.363\n",
            "[2,   160] train_loss: 1.803 train_accuracy: 0.361 test_accuracy: 0.355\n",
            "[2,   165] train_loss: 1.835 train_accuracy: 0.362 test_accuracy: 0.355\n",
            "[2,   170] train_loss: 1.871 train_accuracy: 0.375 test_accuracy: 0.362\n",
            "[2,   175] train_loss: 1.815 train_accuracy: 0.357 test_accuracy: 0.348\n",
            "[2,   180] train_loss: 1.796 train_accuracy: 0.380 test_accuracy: 0.369\n",
            "[2,   185] train_loss: 1.771 train_accuracy: 0.374 test_accuracy: 0.364\n",
            "[2,   190] train_loss: 1.902 train_accuracy: 0.387 test_accuracy: 0.372\n",
            "[2,   195] train_loss: 1.920 train_accuracy: 0.376 test_accuracy: 0.370\n",
            "[2,   200] train_loss: 1.772 train_accuracy: 0.376 test_accuracy: 0.360\n",
            "[2,   205] train_loss: 1.799 train_accuracy: 0.368 test_accuracy: 0.358\n",
            "[2,   210] train_loss: 1.850 train_accuracy: 0.370 test_accuracy: 0.364\n",
            "[2,   215] train_loss: 1.838 train_accuracy: 0.383 test_accuracy: 0.379\n",
            "[2,   220] train_loss: 1.783 train_accuracy: 0.376 test_accuracy: 0.365\n",
            "[2,   225] train_loss: 1.871 train_accuracy: 0.365 test_accuracy: 0.355\n",
            "[2,   230] train_loss: 1.843 train_accuracy: 0.365 test_accuracy: 0.355\n",
            "[2,   235] train_loss: 1.811 train_accuracy: 0.379 test_accuracy: 0.366\n",
            "[2,   240] train_loss: 1.770 train_accuracy: 0.378 test_accuracy: 0.361\n",
            "[2,   245] train_loss: 1.803 train_accuracy: 0.369 test_accuracy: 0.354\n",
            "[2,   250] train_loss: 1.801 train_accuracy: 0.368 test_accuracy: 0.357\n",
            "[2,   255] train_loss: 1.811 train_accuracy: 0.380 test_accuracy: 0.366\n",
            "[2,   260] train_loss: 1.877 train_accuracy: 0.374 test_accuracy: 0.365\n",
            "[2,   265] train_loss: 1.758 train_accuracy: 0.346 test_accuracy: 0.335\n",
            "[2,   270] train_loss: 1.800 train_accuracy: 0.351 test_accuracy: 0.332\n",
            "[2,   275] train_loss: 1.730 train_accuracy: 0.356 test_accuracy: 0.342\n",
            "[2,   280] train_loss: 1.925 train_accuracy: 0.369 test_accuracy: 0.348\n",
            "[2,   285] train_loss: 1.815 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[2,   290] train_loss: 1.722 train_accuracy: 0.363 test_accuracy: 0.357\n",
            "[2,   295] train_loss: 1.864 train_accuracy: 0.344 test_accuracy: 0.335\n",
            "[2,   300] train_loss: 1.767 train_accuracy: 0.368 test_accuracy: 0.354\n",
            "[2,   305] train_loss: 1.750 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[2,   310] train_loss: 1.775 train_accuracy: 0.360 test_accuracy: 0.340\n",
            "[2,   315] train_loss: 1.901 train_accuracy: 0.355 test_accuracy: 0.338\n",
            "[2,   320] train_loss: 1.688 train_accuracy: 0.360 test_accuracy: 0.349\n",
            "[2,   325] train_loss: 1.837 train_accuracy: 0.355 test_accuracy: 0.352\n",
            "[2,   330] train_loss: 1.895 train_accuracy: 0.363 test_accuracy: 0.354\n",
            "[2,   335] train_loss: 1.775 train_accuracy: 0.380 test_accuracy: 0.368\n",
            "[2,   340] train_loss: 1.716 train_accuracy: 0.373 test_accuracy: 0.360\n",
            "[2,   345] train_loss: 1.851 train_accuracy: 0.384 test_accuracy: 0.363\n",
            "[2,   350] train_loss: 1.838 train_accuracy: 0.361 test_accuracy: 0.348\n",
            "[2,   355] train_loss: 1.840 train_accuracy: 0.357 test_accuracy: 0.345\n",
            "[2,   360] train_loss: 1.791 train_accuracy: 0.371 test_accuracy: 0.357\n",
            "[2,   365] train_loss: 1.671 train_accuracy: 0.373 test_accuracy: 0.356\n",
            "[2,   370] train_loss: 1.809 train_accuracy: 0.376 test_accuracy: 0.366\n",
            "[2,   375] train_loss: 1.772 train_accuracy: 0.362 test_accuracy: 0.354\n",
            "[2,   380] train_loss: 1.810 train_accuracy: 0.354 test_accuracy: 0.345\n",
            "[2,   385] train_loss: 1.733 train_accuracy: 0.376 test_accuracy: 0.368\n",
            "[2,   390] train_loss: 1.716 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[2,   395] train_loss: 1.678 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,   400] train_loss: 1.717 train_accuracy: 0.373 test_accuracy: 0.359\n",
            "[2,   405] train_loss: 1.820 train_accuracy: 0.378 test_accuracy: 0.368\n",
            "[2,   410] train_loss: 1.643 train_accuracy: 0.360 test_accuracy: 0.347\n",
            "[2,   415] train_loss: 1.858 train_accuracy: 0.378 test_accuracy: 0.369\n",
            "[2,   420] train_loss: 1.924 train_accuracy: 0.360 test_accuracy: 0.355\n",
            "[2,   425] train_loss: 1.762 train_accuracy: 0.360 test_accuracy: 0.352\n",
            "[2,   430] train_loss: 1.794 train_accuracy: 0.350 test_accuracy: 0.348\n",
            "[2,   435] train_loss: 1.813 train_accuracy: 0.358 test_accuracy: 0.355\n",
            "[2,   440] train_loss: 1.822 train_accuracy: 0.376 test_accuracy: 0.361\n",
            "[2,   445] train_loss: 1.736 train_accuracy: 0.364 test_accuracy: 0.350\n",
            "[2,   450] train_loss: 1.808 train_accuracy: 0.382 test_accuracy: 0.369\n",
            "[2,   455] train_loss: 1.728 train_accuracy: 0.373 test_accuracy: 0.366\n",
            "[2,   460] train_loss: 1.749 train_accuracy: 0.377 test_accuracy: 0.366\n",
            "[2,   465] train_loss: 1.916 train_accuracy: 0.366 test_accuracy: 0.349\n",
            "[2,   470] train_loss: 1.816 train_accuracy: 0.369 test_accuracy: 0.356\n",
            "[2,   475] train_loss: 1.709 train_accuracy: 0.378 test_accuracy: 0.368\n",
            "[2,   480] train_loss: 1.902 train_accuracy: 0.366 test_accuracy: 0.365\n",
            "[2,   485] train_loss: 1.756 train_accuracy: 0.382 test_accuracy: 0.366\n",
            "[2,   490] train_loss: 1.827 train_accuracy: 0.384 test_accuracy: 0.361\n",
            "[2,   495] train_loss: 1.935 train_accuracy: 0.375 test_accuracy: 0.364\n",
            "[2,   500] train_loss: 1.738 train_accuracy: 0.359 test_accuracy: 0.348\n",
            "[2,   505] train_loss: 1.848 train_accuracy: 0.357 test_accuracy: 0.347\n",
            "[2,   510] train_loss: 1.858 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[2,   515] train_loss: 1.756 train_accuracy: 0.372 test_accuracy: 0.359\n",
            "[2,   520] train_loss: 1.786 train_accuracy: 0.374 test_accuracy: 0.360\n",
            "[2,   525] train_loss: 1.788 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[2,   530] train_loss: 1.852 train_accuracy: 0.373 test_accuracy: 0.360\n",
            "[2,   535] train_loss: 1.755 train_accuracy: 0.377 test_accuracy: 0.365\n",
            "[2,   540] train_loss: 1.832 train_accuracy: 0.381 test_accuracy: 0.367\n",
            "[2,   545] train_loss: 1.778 train_accuracy: 0.387 test_accuracy: 0.369\n",
            "[2,   550] train_loss: 1.807 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[2,   555] train_loss: 1.756 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[2,   560] train_loss: 1.800 train_accuracy: 0.352 test_accuracy: 0.340\n",
            "[2,   565] train_loss: 1.758 train_accuracy: 0.368 test_accuracy: 0.355\n",
            "[2,   570] train_loss: 1.713 train_accuracy: 0.377 test_accuracy: 0.364\n",
            "[2,   575] train_loss: 1.799 train_accuracy: 0.371 test_accuracy: 0.356\n",
            "[2,   580] train_loss: 1.747 train_accuracy: 0.373 test_accuracy: 0.363\n",
            "[2,   585] train_loss: 1.823 train_accuracy: 0.386 test_accuracy: 0.377\n",
            "[2,   590] train_loss: 1.799 train_accuracy: 0.388 test_accuracy: 0.378\n",
            "[2,   595] train_loss: 1.800 train_accuracy: 0.382 test_accuracy: 0.367\n",
            "[2,   600] train_loss: 1.804 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[2,   605] train_loss: 1.880 train_accuracy: 0.368 test_accuracy: 0.366\n",
            "[2,   610] train_loss: 1.735 train_accuracy: 0.385 test_accuracy: 0.372\n",
            "[2,   615] train_loss: 1.716 train_accuracy: 0.378 test_accuracy: 0.361\n",
            "[2,   620] train_loss: 1.648 train_accuracy: 0.375 test_accuracy: 0.353\n",
            "[2,   625] train_loss: 1.773 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[2,   630] train_loss: 1.732 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[2,   635] train_loss: 1.744 train_accuracy: 0.376 test_accuracy: 0.369\n",
            "[2,   640] train_loss: 1.811 train_accuracy: 0.382 test_accuracy: 0.371\n",
            "[2,   645] train_loss: 1.848 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[2,   650] train_loss: 1.786 train_accuracy: 0.392 test_accuracy: 0.374\n",
            "[2,   655] train_loss: 1.823 train_accuracy: 0.385 test_accuracy: 0.369\n",
            "[2,   660] train_loss: 1.851 train_accuracy: 0.360 test_accuracy: 0.352\n",
            "[2,   665] train_loss: 1.952 train_accuracy: 0.372 test_accuracy: 0.357\n",
            "[2,   670] train_loss: 1.869 train_accuracy: 0.376 test_accuracy: 0.365\n",
            "[2,   675] train_loss: 1.824 train_accuracy: 0.385 test_accuracy: 0.376\n",
            "[2,   680] train_loss: 1.773 train_accuracy: 0.389 test_accuracy: 0.378\n",
            "[2,   685] train_loss: 1.725 train_accuracy: 0.385 test_accuracy: 0.376\n",
            "[2,   690] train_loss: 1.607 train_accuracy: 0.378 test_accuracy: 0.367\n",
            "[2,   695] train_loss: 1.680 train_accuracy: 0.383 test_accuracy: 0.369\n",
            "[2,   700] train_loss: 1.964 train_accuracy: 0.391 test_accuracy: 0.381\n",
            "[2,   705] train_loss: 1.711 train_accuracy: 0.368 test_accuracy: 0.361\n",
            "[2,   710] train_loss: 1.796 train_accuracy: 0.382 test_accuracy: 0.367\n",
            "[2,   715] train_loss: 1.838 train_accuracy: 0.374 test_accuracy: 0.359\n",
            "[2,   720] train_loss: 1.797 train_accuracy: 0.334 test_accuracy: 0.326\n",
            "[2,   725] train_loss: 1.859 train_accuracy: 0.369 test_accuracy: 0.357\n",
            "[2,   730] train_loss: 1.884 train_accuracy: 0.374 test_accuracy: 0.358\n",
            "[2,   735] train_loss: 1.828 train_accuracy: 0.376 test_accuracy: 0.363\n",
            "[2,   740] train_loss: 1.785 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[2,   745] train_loss: 1.762 train_accuracy: 0.377 test_accuracy: 0.365\n",
            "[2,   750] train_loss: 1.818 train_accuracy: 0.354 test_accuracy: 0.344\n",
            "[2,   755] train_loss: 1.761 train_accuracy: 0.359 test_accuracy: 0.347\n",
            "[2,   760] train_loss: 1.756 train_accuracy: 0.366 test_accuracy: 0.350\n",
            "[2,   765] train_loss: 1.741 train_accuracy: 0.389 test_accuracy: 0.364\n",
            "[2,   770] train_loss: 1.815 train_accuracy: 0.389 test_accuracy: 0.365\n",
            "[2,   775] train_loss: 1.804 train_accuracy: 0.364 test_accuracy: 0.355\n",
            "[2,   780] train_loss: 1.706 train_accuracy: 0.378 test_accuracy: 0.368\n",
            "[2,   785] train_loss: 1.697 train_accuracy: 0.374 test_accuracy: 0.359\n",
            "[2,   790] train_loss: 1.939 train_accuracy: 0.380 test_accuracy: 0.371\n",
            "[2,   795] train_loss: 1.867 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[2,   800] train_loss: 1.764 train_accuracy: 0.385 test_accuracy: 0.376\n",
            "[2,   805] train_loss: 1.758 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[2,   810] train_loss: 1.868 train_accuracy: 0.371 test_accuracy: 0.360\n",
            "[2,   815] train_loss: 1.827 train_accuracy: 0.382 test_accuracy: 0.369\n",
            "[2,   820] train_loss: 1.788 train_accuracy: 0.370 test_accuracy: 0.360\n",
            "[2,   825] train_loss: 1.830 train_accuracy: 0.377 test_accuracy: 0.363\n",
            "[2,   830] train_loss: 1.864 train_accuracy: 0.361 test_accuracy: 0.350\n",
            "[2,   835] train_loss: 1.878 train_accuracy: 0.375 test_accuracy: 0.356\n",
            "[2,   840] train_loss: 1.727 train_accuracy: 0.363 test_accuracy: 0.347\n",
            "[2,   845] train_loss: 1.856 train_accuracy: 0.387 test_accuracy: 0.368\n",
            "[2,   850] train_loss: 1.791 train_accuracy: 0.381 test_accuracy: 0.375\n",
            "[2,   855] train_loss: 1.781 train_accuracy: 0.371 test_accuracy: 0.357\n",
            "[2,   860] train_loss: 1.730 train_accuracy: 0.368 test_accuracy: 0.355\n",
            "[2,   865] train_loss: 1.766 train_accuracy: 0.375 test_accuracy: 0.367\n",
            "[2,   870] train_loss: 1.790 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[2,   875] train_loss: 1.776 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[2,   880] train_loss: 1.697 train_accuracy: 0.377 test_accuracy: 0.362\n",
            "[2,   885] train_loss: 1.854 train_accuracy: 0.370 test_accuracy: 0.351\n",
            "[2,   890] train_loss: 1.838 train_accuracy: 0.376 test_accuracy: 0.355\n",
            "[2,   895] train_loss: 1.916 train_accuracy: 0.364 test_accuracy: 0.350\n",
            "[2,   900] train_loss: 1.751 train_accuracy: 0.361 test_accuracy: 0.348\n",
            "[2,   905] train_loss: 1.895 train_accuracy: 0.383 test_accuracy: 0.366\n",
            "[2,   910] train_loss: 1.884 train_accuracy: 0.367 test_accuracy: 0.347\n",
            "[2,   915] train_loss: 1.845 train_accuracy: 0.372 test_accuracy: 0.360\n",
            "[2,   920] train_loss: 1.766 train_accuracy: 0.372 test_accuracy: 0.365\n",
            "[2,   925] train_loss: 1.830 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[2,   930] train_loss: 1.812 train_accuracy: 0.372 test_accuracy: 0.351\n",
            "[2,   935] train_loss: 1.795 train_accuracy: 0.376 test_accuracy: 0.359\n",
            "[2,   940] train_loss: 1.919 train_accuracy: 0.374 test_accuracy: 0.363\n",
            "[2,   945] train_loss: 1.734 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,   950] train_loss: 1.813 train_accuracy: 0.384 test_accuracy: 0.371\n",
            "[2,   955] train_loss: 1.701 train_accuracy: 0.374 test_accuracy: 0.358\n",
            "[2,   960] train_loss: 1.855 train_accuracy: 0.382 test_accuracy: 0.372\n",
            "[2,   965] train_loss: 1.760 train_accuracy: 0.362 test_accuracy: 0.352\n",
            "[2,   970] train_loss: 1.780 train_accuracy: 0.388 test_accuracy: 0.371\n",
            "[2,   975] train_loss: 1.883 train_accuracy: 0.385 test_accuracy: 0.367\n",
            "[2,   980] train_loss: 1.731 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[2,   985] train_loss: 1.732 train_accuracy: 0.368 test_accuracy: 0.354\n",
            "[2,   990] train_loss: 1.801 train_accuracy: 0.378 test_accuracy: 0.360\n",
            "[2,   995] train_loss: 1.744 train_accuracy: 0.387 test_accuracy: 0.365\n",
            "[2,  1000] train_loss: 1.860 train_accuracy: 0.380 test_accuracy: 0.361\n",
            "[2,  1005] train_loss: 1.736 train_accuracy: 0.378 test_accuracy: 0.360\n",
            "[2,  1010] train_loss: 1.721 train_accuracy: 0.388 test_accuracy: 0.368\n",
            "[2,  1015] train_loss: 1.790 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[2,  1020] train_loss: 1.871 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[2,  1025] train_loss: 1.711 train_accuracy: 0.384 test_accuracy: 0.377\n",
            "[2,  1030] train_loss: 1.727 train_accuracy: 0.388 test_accuracy: 0.375\n",
            "[2,  1035] train_loss: 1.699 train_accuracy: 0.388 test_accuracy: 0.374\n",
            "[2,  1040] train_loss: 1.707 train_accuracy: 0.389 test_accuracy: 0.379\n",
            "[2,  1045] train_loss: 1.611 train_accuracy: 0.381 test_accuracy: 0.377\n",
            "[2,  1050] train_loss: 1.724 train_accuracy: 0.383 test_accuracy: 0.374\n",
            "[2,  1055] train_loss: 1.730 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[2,  1060] train_loss: 1.777 train_accuracy: 0.396 test_accuracy: 0.376\n",
            "[2,  1065] train_loss: 1.786 train_accuracy: 0.391 test_accuracy: 0.375\n",
            "[2,  1070] train_loss: 1.698 train_accuracy: 0.376 test_accuracy: 0.361\n",
            "[2,  1075] train_loss: 1.744 train_accuracy: 0.387 test_accuracy: 0.374\n",
            "[2,  1080] train_loss: 1.840 train_accuracy: 0.386 test_accuracy: 0.374\n",
            "[2,  1085] train_loss: 1.843 train_accuracy: 0.391 test_accuracy: 0.372\n",
            "[2,  1090] train_loss: 1.763 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[2,  1095] train_loss: 1.761 train_accuracy: 0.388 test_accuracy: 0.372\n",
            "[2,  1100] train_loss: 1.777 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[2,  1105] train_loss: 1.777 train_accuracy: 0.397 test_accuracy: 0.374\n",
            "[2,  1110] train_loss: 1.823 train_accuracy: 0.391 test_accuracy: 0.367\n",
            "[2,  1115] train_loss: 1.719 train_accuracy: 0.379 test_accuracy: 0.362\n",
            "[2,  1120] train_loss: 1.670 train_accuracy: 0.379 test_accuracy: 0.366\n",
            "[2,  1125] train_loss: 1.773 train_accuracy: 0.390 test_accuracy: 0.380\n",
            "[2,  1130] train_loss: 1.746 train_accuracy: 0.366 test_accuracy: 0.359\n",
            "[2,  1135] train_loss: 1.708 train_accuracy: 0.385 test_accuracy: 0.368\n",
            "[2,  1140] train_loss: 1.831 train_accuracy: 0.389 test_accuracy: 0.370\n",
            "[2,  1145] train_loss: 1.812 train_accuracy: 0.383 test_accuracy: 0.369\n",
            "[2,  1150] train_loss: 1.719 train_accuracy: 0.384 test_accuracy: 0.366\n",
            "[2,  1155] train_loss: 1.788 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[2,  1160] train_loss: 1.745 train_accuracy: 0.385 test_accuracy: 0.363\n",
            "[2,  1165] train_loss: 1.846 train_accuracy: 0.379 test_accuracy: 0.364\n",
            "[2,  1170] train_loss: 1.854 train_accuracy: 0.377 test_accuracy: 0.366\n",
            "[2,  1175] train_loss: 1.942 train_accuracy: 0.372 test_accuracy: 0.358\n",
            "[2,  1180] train_loss: 1.775 train_accuracy: 0.371 test_accuracy: 0.354\n",
            "[2,  1185] train_loss: 1.847 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[2,  1190] train_loss: 1.780 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[2,  1195] train_loss: 1.762 train_accuracy: 0.387 test_accuracy: 0.364\n",
            "[2,  1200] train_loss: 1.851 train_accuracy: 0.383 test_accuracy: 0.361\n",
            "[2,  1205] train_loss: 1.795 train_accuracy: 0.383 test_accuracy: 0.366\n",
            "[2,  1210] train_loss: 1.801 train_accuracy: 0.386 test_accuracy: 0.376\n",
            "[2,  1215] train_loss: 1.645 train_accuracy: 0.387 test_accuracy: 0.369\n",
            "[2,  1220] train_loss: 1.793 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[2,  1225] train_loss: 1.738 train_accuracy: 0.390 test_accuracy: 0.379\n",
            "[2,  1230] train_loss: 1.758 train_accuracy: 0.390 test_accuracy: 0.380\n",
            "[2,  1235] train_loss: 1.743 train_accuracy: 0.386 test_accuracy: 0.372\n",
            "[2,  1240] train_loss: 1.858 train_accuracy: 0.391 test_accuracy: 0.370\n",
            "[2,  1245] train_loss: 1.731 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[3,     5] train_loss: 1.792 train_accuracy: 0.385 test_accuracy: 0.369\n",
            "[3,    10] train_loss: 1.955 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[3,    15] train_loss: 1.782 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[3,    20] train_loss: 1.647 train_accuracy: 0.385 test_accuracy: 0.370\n",
            "[3,    25] train_loss: 1.660 train_accuracy: 0.381 test_accuracy: 0.370\n",
            "[3,    30] train_loss: 1.829 train_accuracy: 0.378 test_accuracy: 0.366\n",
            "[3,    35] train_loss: 1.756 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[3,    40] train_loss: 1.847 train_accuracy: 0.361 test_accuracy: 0.345\n",
            "[3,    45] train_loss: 1.767 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[3,    50] train_loss: 1.804 train_accuracy: 0.378 test_accuracy: 0.370\n",
            "[3,    55] train_loss: 1.789 train_accuracy: 0.376 test_accuracy: 0.364\n",
            "[3,    60] train_loss: 1.724 train_accuracy: 0.366 test_accuracy: 0.354\n",
            "[3,    65] train_loss: 1.796 train_accuracy: 0.379 test_accuracy: 0.363\n",
            "[3,    70] train_loss: 1.826 train_accuracy: 0.378 test_accuracy: 0.363\n",
            "[3,    75] train_loss: 1.723 train_accuracy: 0.374 test_accuracy: 0.360\n",
            "[3,    80] train_loss: 1.624 train_accuracy: 0.366 test_accuracy: 0.354\n",
            "[3,    85] train_loss: 1.860 train_accuracy: 0.373 test_accuracy: 0.358\n",
            "[3,    90] train_loss: 1.878 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[3,    95] train_loss: 1.731 train_accuracy: 0.382 test_accuracy: 0.362\n",
            "[3,   100] train_loss: 1.737 train_accuracy: 0.382 test_accuracy: 0.365\n",
            "[3,   105] train_loss: 1.672 train_accuracy: 0.385 test_accuracy: 0.372\n",
            "[3,   110] train_loss: 1.956 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   115] train_loss: 1.845 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[3,   120] train_loss: 1.804 train_accuracy: 0.380 test_accuracy: 0.372\n",
            "[3,   125] train_loss: 1.708 train_accuracy: 0.384 test_accuracy: 0.373\n",
            "[3,   130] train_loss: 1.772 train_accuracy: 0.390 test_accuracy: 0.375\n",
            "[3,   135] train_loss: 1.680 train_accuracy: 0.384 test_accuracy: 0.371\n",
            "[3,   140] train_loss: 1.717 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[3,   145] train_loss: 1.780 train_accuracy: 0.393 test_accuracy: 0.381\n",
            "[3,   150] train_loss: 1.757 train_accuracy: 0.395 test_accuracy: 0.383\n",
            "[3,   155] train_loss: 1.620 train_accuracy: 0.395 test_accuracy: 0.376\n",
            "[3,   160] train_loss: 1.828 train_accuracy: 0.384 test_accuracy: 0.366\n",
            "[3,   165] train_loss: 1.742 train_accuracy: 0.373 test_accuracy: 0.355\n",
            "[3,   170] train_loss: 1.707 train_accuracy: 0.361 test_accuracy: 0.350\n",
            "[3,   175] train_loss: 1.716 train_accuracy: 0.381 test_accuracy: 0.370\n",
            "[3,   180] train_loss: 1.827 train_accuracy: 0.388 test_accuracy: 0.370\n",
            "[3,   185] train_loss: 1.830 train_accuracy: 0.370 test_accuracy: 0.359\n",
            "[3,   190] train_loss: 1.761 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[3,   195] train_loss: 1.902 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[3,   200] train_loss: 1.771 train_accuracy: 0.385 test_accuracy: 0.366\n",
            "[3,   205] train_loss: 1.795 train_accuracy: 0.377 test_accuracy: 0.369\n",
            "[3,   210] train_loss: 1.741 train_accuracy: 0.365 test_accuracy: 0.352\n",
            "[3,   215] train_loss: 1.816 train_accuracy: 0.384 test_accuracy: 0.367\n",
            "[3,   220] train_loss: 1.654 train_accuracy: 0.391 test_accuracy: 0.373\n",
            "[3,   225] train_loss: 1.744 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[3,   230] train_loss: 1.849 train_accuracy: 0.386 test_accuracy: 0.366\n",
            "[3,   235] train_loss: 1.864 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[3,   240] train_loss: 1.750 train_accuracy: 0.375 test_accuracy: 0.366\n",
            "[3,   245] train_loss: 1.781 train_accuracy: 0.383 test_accuracy: 0.372\n",
            "[3,   250] train_loss: 1.818 train_accuracy: 0.392 test_accuracy: 0.379\n",
            "[3,   255] train_loss: 1.766 train_accuracy: 0.385 test_accuracy: 0.375\n",
            "[3,   260] train_loss: 1.755 train_accuracy: 0.385 test_accuracy: 0.373\n",
            "[3,   265] train_loss: 1.715 train_accuracy: 0.376 test_accuracy: 0.360\n",
            "[3,   270] train_loss: 1.806 train_accuracy: 0.371 test_accuracy: 0.355\n",
            "[3,   275] train_loss: 1.768 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   280] train_loss: 1.799 train_accuracy: 0.394 test_accuracy: 0.380\n",
            "[3,   285] train_loss: 1.662 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[3,   290] train_loss: 1.741 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[3,   295] train_loss: 1.658 train_accuracy: 0.387 test_accuracy: 0.376\n",
            "[3,   300] train_loss: 1.742 train_accuracy: 0.391 test_accuracy: 0.373\n",
            "[3,   305] train_loss: 1.747 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[3,   310] train_loss: 1.774 train_accuracy: 0.383 test_accuracy: 0.362\n",
            "[3,   315] train_loss: 1.768 train_accuracy: 0.391 test_accuracy: 0.373\n",
            "[3,   320] train_loss: 1.693 train_accuracy: 0.389 test_accuracy: 0.373\n",
            "[3,   325] train_loss: 1.875 train_accuracy: 0.389 test_accuracy: 0.362\n",
            "[3,   330] train_loss: 1.819 train_accuracy: 0.393 test_accuracy: 0.363\n",
            "[3,   335] train_loss: 1.772 train_accuracy: 0.390 test_accuracy: 0.367\n",
            "[3,   340] train_loss: 1.852 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[3,   345] train_loss: 1.886 train_accuracy: 0.392 test_accuracy: 0.370\n",
            "[3,   350] train_loss: 1.687 train_accuracy: 0.376 test_accuracy: 0.361\n",
            "[3,   355] train_loss: 1.756 train_accuracy: 0.375 test_accuracy: 0.364\n",
            "[3,   360] train_loss: 1.795 train_accuracy: 0.389 test_accuracy: 0.378\n",
            "[3,   365] train_loss: 1.745 train_accuracy: 0.394 test_accuracy: 0.379\n",
            "[3,   370] train_loss: 1.796 train_accuracy: 0.389 test_accuracy: 0.372\n",
            "[3,   375] train_loss: 1.828 train_accuracy: 0.374 test_accuracy: 0.357\n",
            "[3,   380] train_loss: 1.807 train_accuracy: 0.390 test_accuracy: 0.378\n",
            "[3,   385] train_loss: 1.848 train_accuracy: 0.385 test_accuracy: 0.380\n",
            "[3,   390] train_loss: 1.729 train_accuracy: 0.378 test_accuracy: 0.364\n",
            "[3,   395] train_loss: 1.878 train_accuracy: 0.375 test_accuracy: 0.359\n",
            "[3,   400] train_loss: 1.674 train_accuracy: 0.383 test_accuracy: 0.371\n",
            "[3,   405] train_loss: 1.659 train_accuracy: 0.389 test_accuracy: 0.377\n",
            "[3,   410] train_loss: 1.729 train_accuracy: 0.395 test_accuracy: 0.378\n",
            "[3,   415] train_loss: 1.692 train_accuracy: 0.400 test_accuracy: 0.379\n",
            "[3,   420] train_loss: 1.796 train_accuracy: 0.396 test_accuracy: 0.382\n",
            "[3,   425] train_loss: 1.731 train_accuracy: 0.382 test_accuracy: 0.373\n",
            "[3,   430] train_loss: 1.782 train_accuracy: 0.394 test_accuracy: 0.386\n",
            "[3,   435] train_loss: 1.856 train_accuracy: 0.397 test_accuracy: 0.381\n",
            "[3,   440] train_loss: 1.750 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   445] train_loss: 1.703 train_accuracy: 0.393 test_accuracy: 0.380\n",
            "[3,   450] train_loss: 1.766 train_accuracy: 0.401 test_accuracy: 0.387\n",
            "[3,   455] train_loss: 1.829 train_accuracy: 0.387 test_accuracy: 0.368\n",
            "[3,   460] train_loss: 1.761 train_accuracy: 0.374 test_accuracy: 0.350\n",
            "[3,   465] train_loss: 1.731 train_accuracy: 0.374 test_accuracy: 0.357\n",
            "[3,   470] train_loss: 1.733 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[3,   475] train_loss: 1.723 train_accuracy: 0.392 test_accuracy: 0.380\n",
            "[3,   480] train_loss: 1.875 train_accuracy: 0.388 test_accuracy: 0.378\n",
            "[3,   485] train_loss: 1.728 train_accuracy: 0.381 test_accuracy: 0.370\n",
            "[3,   490] train_loss: 1.701 train_accuracy: 0.390 test_accuracy: 0.377\n",
            "[3,   495] train_loss: 1.781 train_accuracy: 0.399 test_accuracy: 0.380\n",
            "[3,   500] train_loss: 1.698 train_accuracy: 0.393 test_accuracy: 0.375\n",
            "[3,   505] train_loss: 1.788 train_accuracy: 0.376 test_accuracy: 0.365\n",
            "[3,   510] train_loss: 1.773 train_accuracy: 0.367 test_accuracy: 0.355\n",
            "[3,   515] train_loss: 1.765 train_accuracy: 0.394 test_accuracy: 0.370\n",
            "[3,   520] train_loss: 1.847 train_accuracy: 0.398 test_accuracy: 0.371\n",
            "[3,   525] train_loss: 1.872 train_accuracy: 0.394 test_accuracy: 0.375\n",
            "[3,   530] train_loss: 1.792 train_accuracy: 0.396 test_accuracy: 0.375\n",
            "[3,   535] train_loss: 1.814 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[3,   540] train_loss: 1.918 train_accuracy: 0.387 test_accuracy: 0.360\n",
            "[3,   545] train_loss: 1.751 train_accuracy: 0.380 test_accuracy: 0.359\n",
            "[3,   550] train_loss: 1.797 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[3,   555] train_loss: 1.631 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[3,   560] train_loss: 1.665 train_accuracy: 0.395 test_accuracy: 0.368\n",
            "[3,   565] train_loss: 1.612 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[3,   570] train_loss: 1.786 train_accuracy: 0.401 test_accuracy: 0.376\n",
            "[3,   575] train_loss: 1.897 train_accuracy: 0.397 test_accuracy: 0.372\n",
            "[3,   580] train_loss: 1.701 train_accuracy: 0.389 test_accuracy: 0.368\n",
            "[3,   585] train_loss: 1.824 train_accuracy: 0.390 test_accuracy: 0.366\n",
            "[3,   590] train_loss: 1.836 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[3,   595] train_loss: 1.715 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[3,   600] train_loss: 1.875 train_accuracy: 0.363 test_accuracy: 0.343\n",
            "[3,   605] train_loss: 1.765 train_accuracy: 0.362 test_accuracy: 0.353\n",
            "[3,   610] train_loss: 1.805 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[3,   615] train_loss: 1.703 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[3,   620] train_loss: 1.771 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[3,   625] train_loss: 1.744 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[3,   630] train_loss: 1.705 train_accuracy: 0.392 test_accuracy: 0.372\n",
            "[3,   635] train_loss: 1.903 train_accuracy: 0.403 test_accuracy: 0.373\n",
            "[3,   640] train_loss: 1.756 train_accuracy: 0.411 test_accuracy: 0.386\n",
            "[3,   645] train_loss: 1.759 train_accuracy: 0.407 test_accuracy: 0.382\n",
            "[3,   650] train_loss: 1.701 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[3,   655] train_loss: 1.807 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[3,   660] train_loss: 1.809 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[3,   665] train_loss: 1.761 train_accuracy: 0.378 test_accuracy: 0.371\n",
            "[3,   670] train_loss: 1.667 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[3,   675] train_loss: 1.817 train_accuracy: 0.376 test_accuracy: 0.364\n",
            "[3,   680] train_loss: 1.807 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[3,   685] train_loss: 1.746 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[3,   690] train_loss: 1.749 train_accuracy: 0.407 test_accuracy: 0.385\n",
            "[3,   695] train_loss: 1.816 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[3,   700] train_loss: 1.748 train_accuracy: 0.391 test_accuracy: 0.375\n",
            "[3,   705] train_loss: 1.861 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[3,   710] train_loss: 1.822 train_accuracy: 0.381 test_accuracy: 0.362\n",
            "[3,   715] train_loss: 1.812 train_accuracy: 0.377 test_accuracy: 0.360\n",
            "[3,   720] train_loss: 1.824 train_accuracy: 0.387 test_accuracy: 0.369\n",
            "[3,   725] train_loss: 1.796 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[3,   730] train_loss: 1.784 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[3,   735] train_loss: 1.789 train_accuracy: 0.399 test_accuracy: 0.383\n",
            "[3,   740] train_loss: 1.675 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[3,   745] train_loss: 1.803 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,   750] train_loss: 1.884 train_accuracy: 0.386 test_accuracy: 0.368\n",
            "[3,   755] train_loss: 1.714 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[3,   760] train_loss: 1.706 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   765] train_loss: 1.811 train_accuracy: 0.383 test_accuracy: 0.370\n",
            "[3,   770] train_loss: 1.661 train_accuracy: 0.367 test_accuracy: 0.363\n",
            "[3,   775] train_loss: 1.863 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[3,   780] train_loss: 1.781 train_accuracy: 0.399 test_accuracy: 0.373\n",
            "[3,   785] train_loss: 1.813 train_accuracy: 0.386 test_accuracy: 0.368\n",
            "[3,   790] train_loss: 1.788 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[3,   795] train_loss: 1.794 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[3,   800] train_loss: 1.834 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[3,   805] train_loss: 1.826 train_accuracy: 0.376 test_accuracy: 0.354\n",
            "[3,   810] train_loss: 1.948 train_accuracy: 0.388 test_accuracy: 0.363\n",
            "[3,   815] train_loss: 1.913 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[3,   820] train_loss: 1.776 train_accuracy: 0.392 test_accuracy: 0.377\n",
            "[3,   825] train_loss: 1.717 train_accuracy: 0.382 test_accuracy: 0.370\n",
            "[3,   830] train_loss: 1.816 train_accuracy: 0.389 test_accuracy: 0.373\n",
            "[3,   835] train_loss: 1.810 train_accuracy: 0.400 test_accuracy: 0.374\n",
            "[3,   840] train_loss: 1.759 train_accuracy: 0.380 test_accuracy: 0.364\n",
            "[3,   845] train_loss: 1.822 train_accuracy: 0.397 test_accuracy: 0.376\n",
            "[3,   850] train_loss: 1.829 train_accuracy: 0.389 test_accuracy: 0.373\n",
            "[3,   855] train_loss: 1.802 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[3,   860] train_loss: 1.799 train_accuracy: 0.388 test_accuracy: 0.370\n",
            "[3,   865] train_loss: 1.707 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[3,   870] train_loss: 1.748 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[3,   875] train_loss: 1.755 train_accuracy: 0.379 test_accuracy: 0.364\n",
            "[3,   880] train_loss: 1.743 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[3,   885] train_loss: 1.617 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[3,   890] train_loss: 1.871 train_accuracy: 0.383 test_accuracy: 0.370\n",
            "[3,   895] train_loss: 1.913 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[3,   900] train_loss: 1.786 train_accuracy: 0.396 test_accuracy: 0.379\n",
            "[3,   905] train_loss: 1.879 train_accuracy: 0.385 test_accuracy: 0.364\n",
            "[3,   910] train_loss: 1.809 train_accuracy: 0.396 test_accuracy: 0.380\n",
            "[3,   915] train_loss: 1.812 train_accuracy: 0.379 test_accuracy: 0.366\n",
            "[3,   920] train_loss: 1.802 train_accuracy: 0.388 test_accuracy: 0.370\n",
            "[3,   925] train_loss: 1.797 train_accuracy: 0.399 test_accuracy: 0.372\n",
            "[3,   930] train_loss: 1.812 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[3,   935] train_loss: 1.680 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[3,   940] train_loss: 1.665 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[3,   945] train_loss: 1.712 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[3,   950] train_loss: 1.733 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[3,   955] train_loss: 1.905 train_accuracy: 0.399 test_accuracy: 0.379\n",
            "[3,   960] train_loss: 1.721 train_accuracy: 0.389 test_accuracy: 0.365\n",
            "[3,   965] train_loss: 1.796 train_accuracy: 0.395 test_accuracy: 0.377\n",
            "[3,   970] train_loss: 1.711 train_accuracy: 0.372 test_accuracy: 0.357\n",
            "[3,   975] train_loss: 1.924 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[3,   980] train_loss: 1.753 train_accuracy: 0.387 test_accuracy: 0.365\n",
            "[3,   985] train_loss: 1.692 train_accuracy: 0.395 test_accuracy: 0.373\n",
            "[3,   990] train_loss: 1.766 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[3,   995] train_loss: 1.710 train_accuracy: 0.398 test_accuracy: 0.384\n",
            "[3,  1000] train_loss: 1.725 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[3,  1005] train_loss: 1.766 train_accuracy: 0.398 test_accuracy: 0.368\n",
            "[3,  1010] train_loss: 1.784 train_accuracy: 0.396 test_accuracy: 0.369\n",
            "[3,  1015] train_loss: 1.792 train_accuracy: 0.398 test_accuracy: 0.371\n",
            "[3,  1020] train_loss: 1.662 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[3,  1025] train_loss: 1.715 train_accuracy: 0.390 test_accuracy: 0.375\n",
            "[3,  1030] train_loss: 1.776 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[3,  1035] train_loss: 1.886 train_accuracy: 0.408 test_accuracy: 0.384\n",
            "[3,  1040] train_loss: 1.691 train_accuracy: 0.398 test_accuracy: 0.373\n",
            "[3,  1045] train_loss: 1.927 train_accuracy: 0.397 test_accuracy: 0.379\n",
            "[3,  1050] train_loss: 1.811 train_accuracy: 0.394 test_accuracy: 0.374\n",
            "[3,  1055] train_loss: 1.737 train_accuracy: 0.390 test_accuracy: 0.366\n",
            "[3,  1060] train_loss: 1.667 train_accuracy: 0.384 test_accuracy: 0.358\n",
            "[3,  1065] train_loss: 1.657 train_accuracy: 0.395 test_accuracy: 0.374\n",
            "[3,  1070] train_loss: 1.746 train_accuracy: 0.405 test_accuracy: 0.379\n",
            "[3,  1075] train_loss: 1.815 train_accuracy: 0.406 test_accuracy: 0.378\n",
            "[3,  1080] train_loss: 1.800 train_accuracy: 0.395 test_accuracy: 0.370\n",
            "[3,  1085] train_loss: 1.771 train_accuracy: 0.396 test_accuracy: 0.374\n",
            "[3,  1090] train_loss: 1.824 train_accuracy: 0.387 test_accuracy: 0.369\n",
            "[3,  1095] train_loss: 1.768 train_accuracy: 0.397 test_accuracy: 0.377\n",
            "[3,  1100] train_loss: 1.792 train_accuracy: 0.396 test_accuracy: 0.379\n",
            "[3,  1105] train_loss: 1.603 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[3,  1110] train_loss: 1.807 train_accuracy: 0.376 test_accuracy: 0.356\n",
            "[3,  1115] train_loss: 1.925 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,  1120] train_loss: 1.772 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[3,  1125] train_loss: 1.752 train_accuracy: 0.408 test_accuracy: 0.395\n",
            "[3,  1130] train_loss: 1.765 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[3,  1135] train_loss: 1.811 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[3,  1140] train_loss: 1.789 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[3,  1145] train_loss: 1.812 train_accuracy: 0.403 test_accuracy: 0.380\n",
            "[3,  1150] train_loss: 1.673 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[3,  1155] train_loss: 1.734 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[3,  1160] train_loss: 1.657 train_accuracy: 0.396 test_accuracy: 0.373\n",
            "[3,  1165] train_loss: 1.705 train_accuracy: 0.384 test_accuracy: 0.369\n",
            "[3,  1170] train_loss: 1.828 train_accuracy: 0.397 test_accuracy: 0.377\n",
            "[3,  1175] train_loss: 1.812 train_accuracy: 0.406 test_accuracy: 0.384\n",
            "[3,  1180] train_loss: 1.713 train_accuracy: 0.395 test_accuracy: 0.375\n",
            "[3,  1185] train_loss: 1.818 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[3,  1190] train_loss: 1.645 train_accuracy: 0.396 test_accuracy: 0.379\n",
            "[3,  1195] train_loss: 1.824 train_accuracy: 0.397 test_accuracy: 0.381\n",
            "[3,  1200] train_loss: 1.980 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,  1205] train_loss: 1.819 train_accuracy: 0.404 test_accuracy: 0.387\n",
            "[3,  1210] train_loss: 1.714 train_accuracy: 0.397 test_accuracy: 0.382\n",
            "[3,  1215] train_loss: 1.693 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[3,  1220] train_loss: 1.721 train_accuracy: 0.398 test_accuracy: 0.386\n",
            "[3,  1225] train_loss: 1.873 train_accuracy: 0.391 test_accuracy: 0.383\n",
            "[3,  1230] train_loss: 1.791 train_accuracy: 0.384 test_accuracy: 0.367\n",
            "[3,  1235] train_loss: 1.622 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[3,  1240] train_loss: 1.785 train_accuracy: 0.390 test_accuracy: 0.368\n",
            "[3,  1245] train_loss: 1.754 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[4,     5] train_loss: 1.782 train_accuracy: 0.387 test_accuracy: 0.368\n",
            "[4,    10] train_loss: 1.715 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[4,    15] train_loss: 1.795 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[4,    20] train_loss: 1.738 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[4,    25] train_loss: 1.803 train_accuracy: 0.383 test_accuracy: 0.373\n",
            "[4,    30] train_loss: 1.634 train_accuracy: 0.398 test_accuracy: 0.380\n",
            "[4,    35] train_loss: 1.699 train_accuracy: 0.397 test_accuracy: 0.376\n",
            "[4,    40] train_loss: 1.818 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[4,    45] train_loss: 1.640 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[4,    50] train_loss: 1.918 train_accuracy: 0.383 test_accuracy: 0.368\n",
            "[4,    55] train_loss: 1.716 train_accuracy: 0.374 test_accuracy: 0.366\n",
            "[4,    60] train_loss: 1.740 train_accuracy: 0.382 test_accuracy: 0.370\n",
            "[4,    65] train_loss: 1.820 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[4,    70] train_loss: 1.821 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[4,    75] train_loss: 1.746 train_accuracy: 0.405 test_accuracy: 0.379\n",
            "[4,    80] train_loss: 1.774 train_accuracy: 0.414 test_accuracy: 0.385\n",
            "[4,    85] train_loss: 1.658 train_accuracy: 0.403 test_accuracy: 0.381\n",
            "[4,    90] train_loss: 1.749 train_accuracy: 0.382 test_accuracy: 0.377\n",
            "[4,    95] train_loss: 1.849 train_accuracy: 0.376 test_accuracy: 0.373\n",
            "[4,   100] train_loss: 1.758 train_accuracy: 0.392 test_accuracy: 0.380\n",
            "[4,   105] train_loss: 1.817 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[4,   110] train_loss: 1.896 train_accuracy: 0.400 test_accuracy: 0.385\n",
            "[4,   115] train_loss: 1.774 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[4,   120] train_loss: 1.850 train_accuracy: 0.397 test_accuracy: 0.379\n",
            "[4,   125] train_loss: 1.789 train_accuracy: 0.402 test_accuracy: 0.382\n",
            "[4,   130] train_loss: 1.690 train_accuracy: 0.386 test_accuracy: 0.374\n",
            "[4,   135] train_loss: 1.820 train_accuracy: 0.400 test_accuracy: 0.384\n",
            "[4,   140] train_loss: 1.783 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[4,   145] train_loss: 1.870 train_accuracy: 0.404 test_accuracy: 0.392\n",
            "[4,   150] train_loss: 1.742 train_accuracy: 0.396 test_accuracy: 0.383\n",
            "[4,   155] train_loss: 1.796 train_accuracy: 0.383 test_accuracy: 0.372\n",
            "[4,   160] train_loss: 1.767 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[4,   165] train_loss: 1.797 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[4,   170] train_loss: 1.905 train_accuracy: 0.388 test_accuracy: 0.374\n",
            "[4,   175] train_loss: 1.795 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,   180] train_loss: 1.775 train_accuracy: 0.395 test_accuracy: 0.372\n",
            "[4,   185] train_loss: 1.806 train_accuracy: 0.356 test_accuracy: 0.340\n",
            "[4,   190] train_loss: 1.709 train_accuracy: 0.381 test_accuracy: 0.363\n",
            "[4,   195] train_loss: 1.860 train_accuracy: 0.390 test_accuracy: 0.368\n",
            "[4,   200] train_loss: 1.716 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[4,   205] train_loss: 1.687 train_accuracy: 0.394 test_accuracy: 0.381\n",
            "[4,   210] train_loss: 1.812 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[4,   215] train_loss: 1.915 train_accuracy: 0.382 test_accuracy: 0.366\n",
            "[4,   220] train_loss: 1.730 train_accuracy: 0.371 test_accuracy: 0.359\n",
            "[4,   225] train_loss: 1.841 train_accuracy: 0.379 test_accuracy: 0.360\n",
            "[4,   230] train_loss: 1.782 train_accuracy: 0.373 test_accuracy: 0.363\n",
            "[4,   235] train_loss: 1.694 train_accuracy: 0.381 test_accuracy: 0.377\n",
            "[4,   240] train_loss: 1.767 train_accuracy: 0.390 test_accuracy: 0.375\n",
            "[4,   245] train_loss: 1.745 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[4,   250] train_loss: 1.744 train_accuracy: 0.384 test_accuracy: 0.369\n",
            "[4,   255] train_loss: 1.731 train_accuracy: 0.381 test_accuracy: 0.367\n",
            "[4,   260] train_loss: 1.712 train_accuracy: 0.400 test_accuracy: 0.378\n",
            "[4,   265] train_loss: 1.686 train_accuracy: 0.400 test_accuracy: 0.374\n",
            "[4,   270] train_loss: 1.766 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,   275] train_loss: 1.800 train_accuracy: 0.404 test_accuracy: 0.381\n",
            "[4,   280] train_loss: 1.746 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[4,   285] train_loss: 1.840 train_accuracy: 0.373 test_accuracy: 0.359\n",
            "[4,   290] train_loss: 1.761 train_accuracy: 0.392 test_accuracy: 0.368\n",
            "[4,   295] train_loss: 1.836 train_accuracy: 0.402 test_accuracy: 0.379\n",
            "[4,   300] train_loss: 1.720 train_accuracy: 0.401 test_accuracy: 0.375\n",
            "[4,   305] train_loss: 1.789 train_accuracy: 0.403 test_accuracy: 0.377\n",
            "[4,   310] train_loss: 1.525 train_accuracy: 0.383 test_accuracy: 0.365\n",
            "[4,   315] train_loss: 1.749 train_accuracy: 0.376 test_accuracy: 0.367\n",
            "[4,   320] train_loss: 1.687 train_accuracy: 0.365 test_accuracy: 0.355\n",
            "[4,   325] train_loss: 1.775 train_accuracy: 0.386 test_accuracy: 0.376\n",
            "[4,   330] train_loss: 1.747 train_accuracy: 0.388 test_accuracy: 0.375\n",
            "[4,   335] train_loss: 1.861 train_accuracy: 0.394 test_accuracy: 0.368\n",
            "[4,   340] train_loss: 1.777 train_accuracy: 0.400 test_accuracy: 0.375\n",
            "[4,   345] train_loss: 1.671 train_accuracy: 0.403 test_accuracy: 0.380\n",
            "[4,   350] train_loss: 1.732 train_accuracy: 0.404 test_accuracy: 0.383\n",
            "[4,   355] train_loss: 1.720 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[4,   360] train_loss: 1.721 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[4,   365] train_loss: 1.757 train_accuracy: 0.391 test_accuracy: 0.380\n",
            "[4,   370] train_loss: 1.773 train_accuracy: 0.395 test_accuracy: 0.374\n",
            "[4,   375] train_loss: 1.736 train_accuracy: 0.395 test_accuracy: 0.378\n",
            "[4,   380] train_loss: 1.676 train_accuracy: 0.399 test_accuracy: 0.376\n",
            "[4,   385] train_loss: 1.830 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[4,   390] train_loss: 1.762 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[4,   395] train_loss: 1.764 train_accuracy: 0.392 test_accuracy: 0.380\n",
            "[4,   400] train_loss: 1.773 train_accuracy: 0.395 test_accuracy: 0.382\n",
            "[4,   405] train_loss: 1.755 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[4,   410] train_loss: 1.805 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[4,   415] train_loss: 1.785 train_accuracy: 0.400 test_accuracy: 0.384\n",
            "[4,   420] train_loss: 1.718 train_accuracy: 0.411 test_accuracy: 0.390\n",
            "[4,   425] train_loss: 1.952 train_accuracy: 0.407 test_accuracy: 0.382\n",
            "[4,   430] train_loss: 1.813 train_accuracy: 0.403 test_accuracy: 0.384\n",
            "[4,   435] train_loss: 1.756 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[4,   440] train_loss: 1.681 train_accuracy: 0.394 test_accuracy: 0.377\n",
            "[4,   445] train_loss: 1.811 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[4,   450] train_loss: 1.893 train_accuracy: 0.385 test_accuracy: 0.370\n",
            "[4,   455] train_loss: 1.728 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[4,   460] train_loss: 1.767 train_accuracy: 0.400 test_accuracy: 0.382\n",
            "[4,   465] train_loss: 1.805 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[4,   470] train_loss: 1.618 train_accuracy: 0.389 test_accuracy: 0.370\n",
            "[4,   475] train_loss: 1.677 train_accuracy: 0.394 test_accuracy: 0.366\n",
            "[4,   480] train_loss: 1.839 train_accuracy: 0.384 test_accuracy: 0.364\n",
            "[4,   485] train_loss: 1.712 train_accuracy: 0.385 test_accuracy: 0.368\n",
            "[4,   490] train_loss: 1.706 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[4,   495] train_loss: 1.762 train_accuracy: 0.408 test_accuracy: 0.384\n",
            "[4,   500] train_loss: 1.672 train_accuracy: 0.402 test_accuracy: 0.381\n",
            "[4,   505] train_loss: 1.725 train_accuracy: 0.397 test_accuracy: 0.379\n",
            "[4,   510] train_loss: 1.781 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[4,   515] train_loss: 1.704 train_accuracy: 0.396 test_accuracy: 0.384\n",
            "[4,   520] train_loss: 1.651 train_accuracy: 0.388 test_accuracy: 0.377\n",
            "[4,   525] train_loss: 1.679 train_accuracy: 0.386 test_accuracy: 0.379\n",
            "[4,   530] train_loss: 1.849 train_accuracy: 0.394 test_accuracy: 0.380\n",
            "[4,   535] train_loss: 1.903 train_accuracy: 0.388 test_accuracy: 0.368\n",
            "[4,   540] train_loss: 1.841 train_accuracy: 0.389 test_accuracy: 0.369\n",
            "[4,   545] train_loss: 1.687 train_accuracy: 0.395 test_accuracy: 0.378\n",
            "[4,   550] train_loss: 1.727 train_accuracy: 0.397 test_accuracy: 0.388\n",
            "[4,   555] train_loss: 1.777 train_accuracy: 0.382 test_accuracy: 0.369\n",
            "[4,   560] train_loss: 1.724 train_accuracy: 0.381 test_accuracy: 0.368\n",
            "[4,   565] train_loss: 1.720 train_accuracy: 0.393 test_accuracy: 0.379\n",
            "[4,   570] train_loss: 1.654 train_accuracy: 0.393 test_accuracy: 0.382\n",
            "[4,   575] train_loss: 1.673 train_accuracy: 0.378 test_accuracy: 0.371\n",
            "[4,   580] train_loss: 1.802 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[4,   585] train_loss: 1.790 train_accuracy: 0.397 test_accuracy: 0.374\n",
            "[4,   590] train_loss: 1.735 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[4,   595] train_loss: 1.595 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[4,   600] train_loss: 1.738 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[4,   605] train_loss: 1.805 train_accuracy: 0.401 test_accuracy: 0.385\n",
            "[4,   610] train_loss: 1.756 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[4,   615] train_loss: 1.691 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[4,   620] train_loss: 1.784 train_accuracy: 0.403 test_accuracy: 0.380\n",
            "[4,   625] train_loss: 1.682 train_accuracy: 0.394 test_accuracy: 0.374\n",
            "[4,   630] train_loss: 1.605 train_accuracy: 0.401 test_accuracy: 0.386\n",
            "[4,   635] train_loss: 1.740 train_accuracy: 0.397 test_accuracy: 0.385\n",
            "[4,   640] train_loss: 1.813 train_accuracy: 0.403 test_accuracy: 0.385\n",
            "[4,   645] train_loss: 1.698 train_accuracy: 0.396 test_accuracy: 0.388\n",
            "[4,   650] train_loss: 1.778 train_accuracy: 0.392 test_accuracy: 0.380\n",
            "[4,   655] train_loss: 1.765 train_accuracy: 0.392 test_accuracy: 0.380\n",
            "[4,   660] train_loss: 1.751 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[4,   665] train_loss: 1.790 train_accuracy: 0.383 test_accuracy: 0.371\n",
            "[4,   670] train_loss: 1.870 train_accuracy: 0.395 test_accuracy: 0.378\n",
            "[4,   675] train_loss: 1.764 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[4,   680] train_loss: 1.736 train_accuracy: 0.411 test_accuracy: 0.390\n",
            "[4,   685] train_loss: 1.785 train_accuracy: 0.401 test_accuracy: 0.383\n",
            "[4,   690] train_loss: 1.778 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[4,   695] train_loss: 1.763 train_accuracy: 0.400 test_accuracy: 0.384\n",
            "[4,   700] train_loss: 1.812 train_accuracy: 0.402 test_accuracy: 0.386\n",
            "[4,   705] train_loss: 1.778 train_accuracy: 0.405 test_accuracy: 0.390\n",
            "[4,   710] train_loss: 1.663 train_accuracy: 0.394 test_accuracy: 0.377\n",
            "[4,   715] train_loss: 1.812 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[4,   720] train_loss: 1.599 train_accuracy: 0.410 test_accuracy: 0.387\n",
            "[4,   725] train_loss: 1.728 train_accuracy: 0.406 test_accuracy: 0.388\n",
            "[4,   730] train_loss: 1.845 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[4,   735] train_loss: 1.697 train_accuracy: 0.391 test_accuracy: 0.375\n",
            "[4,   740] train_loss: 1.715 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[4,   745] train_loss: 1.751 train_accuracy: 0.400 test_accuracy: 0.382\n",
            "[4,   750] train_loss: 1.836 train_accuracy: 0.400 test_accuracy: 0.387\n",
            "[4,   755] train_loss: 1.622 train_accuracy: 0.407 test_accuracy: 0.388\n",
            "[4,   760] train_loss: 1.896 train_accuracy: 0.395 test_accuracy: 0.384\n",
            "[4,   765] train_loss: 1.749 train_accuracy: 0.404 test_accuracy: 0.389\n",
            "[4,   770] train_loss: 1.728 train_accuracy: 0.394 test_accuracy: 0.377\n",
            "[4,   775] train_loss: 1.768 train_accuracy: 0.392 test_accuracy: 0.377\n",
            "[4,   780] train_loss: 1.815 train_accuracy: 0.398 test_accuracy: 0.369\n",
            "[4,   785] train_loss: 1.781 train_accuracy: 0.397 test_accuracy: 0.370\n",
            "[4,   790] train_loss: 1.837 train_accuracy: 0.392 test_accuracy: 0.372\n",
            "[4,   795] train_loss: 1.841 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[4,   800] train_loss: 1.819 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,   805] train_loss: 1.685 train_accuracy: 0.398 test_accuracy: 0.379\n",
            "[4,   810] train_loss: 1.811 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[4,   815] train_loss: 1.684 train_accuracy: 0.414 test_accuracy: 0.391\n",
            "[4,   820] train_loss: 1.691 train_accuracy: 0.403 test_accuracy: 0.387\n",
            "[4,   825] train_loss: 1.700 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[4,   830] train_loss: 1.770 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[4,   835] train_loss: 1.821 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[4,   840] train_loss: 1.741 train_accuracy: 0.396 test_accuracy: 0.376\n",
            "[4,   845] train_loss: 1.797 train_accuracy: 0.405 test_accuracy: 0.378\n",
            "[4,   850] train_loss: 1.856 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[4,   855] train_loss: 1.714 train_accuracy: 0.399 test_accuracy: 0.388\n",
            "[4,   860] train_loss: 1.784 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[4,   865] train_loss: 1.816 train_accuracy: 0.399 test_accuracy: 0.379\n",
            "[4,   870] train_loss: 1.639 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[4,   875] train_loss: 1.773 train_accuracy: 0.398 test_accuracy: 0.384\n",
            "[4,   880] train_loss: 1.773 train_accuracy: 0.408 test_accuracy: 0.390\n",
            "[4,   885] train_loss: 1.668 train_accuracy: 0.403 test_accuracy: 0.383\n",
            "[4,   890] train_loss: 1.592 train_accuracy: 0.389 test_accuracy: 0.370\n",
            "[4,   895] train_loss: 1.795 train_accuracy: 0.392 test_accuracy: 0.368\n",
            "[4,   900] train_loss: 1.705 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[4,   905] train_loss: 1.703 train_accuracy: 0.390 test_accuracy: 0.368\n",
            "[4,   910] train_loss: 1.811 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[4,   915] train_loss: 1.801 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[4,   920] train_loss: 1.800 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[4,   925] train_loss: 1.760 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[4,   930] train_loss: 1.744 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[4,   935] train_loss: 1.678 train_accuracy: 0.394 test_accuracy: 0.372\n",
            "[4,   940] train_loss: 1.882 train_accuracy: 0.400 test_accuracy: 0.379\n",
            "[4,   945] train_loss: 1.685 train_accuracy: 0.408 test_accuracy: 0.387\n",
            "[4,   950] train_loss: 1.717 train_accuracy: 0.410 test_accuracy: 0.387\n",
            "[4,   955] train_loss: 1.796 train_accuracy: 0.401 test_accuracy: 0.387\n",
            "[4,   960] train_loss: 1.706 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[4,   965] train_loss: 1.742 train_accuracy: 0.403 test_accuracy: 0.381\n",
            "[4,   970] train_loss: 1.699 train_accuracy: 0.400 test_accuracy: 0.383\n",
            "[4,   975] train_loss: 1.741 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[4,   980] train_loss: 1.854 train_accuracy: 0.407 test_accuracy: 0.391\n",
            "[4,   985] train_loss: 1.799 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[4,   990] train_loss: 1.786 train_accuracy: 0.404 test_accuracy: 0.382\n",
            "[4,   995] train_loss: 1.780 train_accuracy: 0.409 test_accuracy: 0.390\n",
            "[4,  1000] train_loss: 1.852 train_accuracy: 0.403 test_accuracy: 0.381\n",
            "[4,  1005] train_loss: 1.741 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[4,  1010] train_loss: 1.725 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[4,  1015] train_loss: 1.821 train_accuracy: 0.396 test_accuracy: 0.376\n",
            "[4,  1020] train_loss: 1.776 train_accuracy: 0.408 test_accuracy: 0.385\n",
            "[4,  1025] train_loss: 1.685 train_accuracy: 0.405 test_accuracy: 0.380\n",
            "[4,  1030] train_loss: 1.693 train_accuracy: 0.404 test_accuracy: 0.386\n",
            "[4,  1035] train_loss: 1.854 train_accuracy: 0.399 test_accuracy: 0.384\n",
            "[4,  1040] train_loss: 1.777 train_accuracy: 0.401 test_accuracy: 0.383\n",
            "[4,  1045] train_loss: 1.743 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[4,  1050] train_loss: 1.650 train_accuracy: 0.391 test_accuracy: 0.375\n",
            "[4,  1055] train_loss: 1.627 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[4,  1060] train_loss: 1.626 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[4,  1065] train_loss: 1.992 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[4,  1070] train_loss: 1.779 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[4,  1075] train_loss: 1.702 train_accuracy: 0.397 test_accuracy: 0.373\n",
            "[4,  1080] train_loss: 1.618 train_accuracy: 0.399 test_accuracy: 0.378\n",
            "[4,  1085] train_loss: 1.744 train_accuracy: 0.405 test_accuracy: 0.382\n",
            "[4,  1090] train_loss: 1.550 train_accuracy: 0.393 test_accuracy: 0.370\n",
            "[4,  1095] train_loss: 1.790 train_accuracy: 0.403 test_accuracy: 0.381\n",
            "[4,  1100] train_loss: 1.579 train_accuracy: 0.399 test_accuracy: 0.378\n",
            "[4,  1105] train_loss: 1.713 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[4,  1110] train_loss: 1.831 train_accuracy: 0.375 test_accuracy: 0.359\n",
            "[4,  1115] train_loss: 1.787 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[4,  1120] train_loss: 1.739 train_accuracy: 0.392 test_accuracy: 0.374\n",
            "[4,  1125] train_loss: 1.762 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[4,  1130] train_loss: 1.805 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[4,  1135] train_loss: 1.728 train_accuracy: 0.397 test_accuracy: 0.372\n",
            "[4,  1140] train_loss: 1.712 train_accuracy: 0.412 test_accuracy: 0.381\n",
            "[4,  1145] train_loss: 1.832 train_accuracy: 0.411 test_accuracy: 0.387\n",
            "[4,  1150] train_loss: 1.710 train_accuracy: 0.403 test_accuracy: 0.385\n",
            "[4,  1155] train_loss: 1.714 train_accuracy: 0.407 test_accuracy: 0.384\n",
            "[4,  1160] train_loss: 1.815 train_accuracy: 0.405 test_accuracy: 0.386\n",
            "[4,  1165] train_loss: 1.771 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[4,  1170] train_loss: 1.836 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[4,  1175] train_loss: 1.792 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[4,  1180] train_loss: 1.752 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[4,  1185] train_loss: 1.696 train_accuracy: 0.392 test_accuracy: 0.371\n",
            "[4,  1190] train_loss: 1.688 train_accuracy: 0.395 test_accuracy: 0.373\n",
            "[4,  1195] train_loss: 1.800 train_accuracy: 0.405 test_accuracy: 0.385\n",
            "[4,  1200] train_loss: 1.759 train_accuracy: 0.392 test_accuracy: 0.378\n",
            "[4,  1205] train_loss: 1.796 train_accuracy: 0.374 test_accuracy: 0.362\n",
            "[4,  1210] train_loss: 1.900 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[4,  1215] train_loss: 1.708 train_accuracy: 0.403 test_accuracy: 0.381\n",
            "[4,  1220] train_loss: 1.756 train_accuracy: 0.401 test_accuracy: 0.372\n",
            "[4,  1225] train_loss: 1.685 train_accuracy: 0.401 test_accuracy: 0.373\n",
            "[4,  1230] train_loss: 1.578 train_accuracy: 0.403 test_accuracy: 0.380\n",
            "[4,  1235] train_loss: 1.781 train_accuracy: 0.390 test_accuracy: 0.376\n",
            "[4,  1240] train_loss: 1.696 train_accuracy: 0.406 test_accuracy: 0.385\n",
            "[4,  1245] train_loss: 1.728 train_accuracy: 0.409 test_accuracy: 0.386\n",
            "[5,     5] train_loss: 1.767 train_accuracy: 0.393 test_accuracy: 0.373\n",
            "[5,    10] train_loss: 1.733 train_accuracy: 0.390 test_accuracy: 0.376\n",
            "[5,    15] train_loss: 1.720 train_accuracy: 0.395 test_accuracy: 0.380\n",
            "[5,    20] train_loss: 1.652 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[5,    25] train_loss: 1.834 train_accuracy: 0.381 test_accuracy: 0.364\n",
            "[5,    30] train_loss: 1.637 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[5,    35] train_loss: 1.687 train_accuracy: 0.390 test_accuracy: 0.378\n",
            "[5,    40] train_loss: 1.788 train_accuracy: 0.388 test_accuracy: 0.372\n",
            "[5,    45] train_loss: 1.623 train_accuracy: 0.389 test_accuracy: 0.372\n",
            "[5,    50] train_loss: 1.816 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[5,    55] train_loss: 1.797 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[5,    60] train_loss: 1.843 train_accuracy: 0.388 test_accuracy: 0.375\n",
            "[5,    65] train_loss: 1.720 train_accuracy: 0.396 test_accuracy: 0.373\n",
            "[5,    70] train_loss: 1.760 train_accuracy: 0.404 test_accuracy: 0.377\n",
            "[5,    75] train_loss: 1.612 train_accuracy: 0.397 test_accuracy: 0.370\n",
            "[5,    80] train_loss: 1.754 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[5,    85] train_loss: 1.608 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,    90] train_loss: 1.848 train_accuracy: 0.409 test_accuracy: 0.388\n",
            "[5,    95] train_loss: 1.683 train_accuracy: 0.413 test_accuracy: 0.390\n",
            "[5,   100] train_loss: 1.721 train_accuracy: 0.406 test_accuracy: 0.384\n",
            "[5,   105] train_loss: 1.625 train_accuracy: 0.409 test_accuracy: 0.387\n",
            "[5,   110] train_loss: 1.753 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[5,   115] train_loss: 1.741 train_accuracy: 0.384 test_accuracy: 0.372\n",
            "[5,   120] train_loss: 1.808 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[5,   125] train_loss: 1.665 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[5,   130] train_loss: 1.794 train_accuracy: 0.407 test_accuracy: 0.383\n",
            "[5,   135] train_loss: 1.652 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   140] train_loss: 1.751 train_accuracy: 0.412 test_accuracy: 0.395\n",
            "[5,   145] train_loss: 1.626 train_accuracy: 0.413 test_accuracy: 0.391\n",
            "[5,   150] train_loss: 1.691 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[5,   155] train_loss: 1.715 train_accuracy: 0.404 test_accuracy: 0.379\n",
            "[5,   160] train_loss: 1.822 train_accuracy: 0.406 test_accuracy: 0.384\n",
            "[5,   165] train_loss: 1.613 train_accuracy: 0.402 test_accuracy: 0.381\n",
            "[5,   170] train_loss: 1.707 train_accuracy: 0.408 test_accuracy: 0.386\n",
            "[5,   175] train_loss: 1.863 train_accuracy: 0.412 test_accuracy: 0.384\n",
            "[5,   180] train_loss: 1.846 train_accuracy: 0.409 test_accuracy: 0.384\n",
            "[5,   185] train_loss: 1.838 train_accuracy: 0.411 test_accuracy: 0.385\n",
            "[5,   190] train_loss: 1.855 train_accuracy: 0.414 test_accuracy: 0.389\n",
            "[5,   195] train_loss: 1.712 train_accuracy: 0.409 test_accuracy: 0.387\n",
            "[5,   200] train_loss: 1.674 train_accuracy: 0.401 test_accuracy: 0.385\n",
            "[5,   205] train_loss: 1.772 train_accuracy: 0.410 test_accuracy: 0.389\n",
            "[5,   210] train_loss: 1.696 train_accuracy: 0.409 test_accuracy: 0.385\n",
            "[5,   215] train_loss: 1.661 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[5,   220] train_loss: 1.666 train_accuracy: 0.390 test_accuracy: 0.375\n",
            "[5,   225] train_loss: 1.737 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   230] train_loss: 1.665 train_accuracy: 0.406 test_accuracy: 0.389\n",
            "[5,   235] train_loss: 1.762 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   240] train_loss: 1.774 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   245] train_loss: 1.792 train_accuracy: 0.406 test_accuracy: 0.385\n",
            "[5,   250] train_loss: 1.753 train_accuracy: 0.406 test_accuracy: 0.381\n",
            "[5,   255] train_loss: 1.690 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[5,   260] train_loss: 1.696 train_accuracy: 0.412 test_accuracy: 0.384\n",
            "[5,   265] train_loss: 1.942 train_accuracy: 0.413 test_accuracy: 0.389\n",
            "[5,   270] train_loss: 1.683 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[5,   275] train_loss: 1.716 train_accuracy: 0.400 test_accuracy: 0.380\n",
            "[5,   280] train_loss: 1.798 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[5,   285] train_loss: 1.733 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[5,   290] train_loss: 1.605 train_accuracy: 0.398 test_accuracy: 0.382\n",
            "[5,   295] train_loss: 1.743 train_accuracy: 0.394 test_accuracy: 0.379\n",
            "[5,   300] train_loss: 1.719 train_accuracy: 0.402 test_accuracy: 0.382\n",
            "[5,   305] train_loss: 1.794 train_accuracy: 0.409 test_accuracy: 0.387\n",
            "[5,   310] train_loss: 1.612 train_accuracy: 0.414 test_accuracy: 0.391\n",
            "[5,   315] train_loss: 1.814 train_accuracy: 0.406 test_accuracy: 0.387\n",
            "[5,   320] train_loss: 1.753 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[5,   325] train_loss: 1.883 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[5,   330] train_loss: 1.637 train_accuracy: 0.392 test_accuracy: 0.378\n",
            "[5,   335] train_loss: 1.690 train_accuracy: 0.403 test_accuracy: 0.384\n",
            "[5,   340] train_loss: 1.677 train_accuracy: 0.405 test_accuracy: 0.390\n",
            "[5,   345] train_loss: 1.639 train_accuracy: 0.413 test_accuracy: 0.388\n",
            "[5,   350] train_loss: 1.684 train_accuracy: 0.401 test_accuracy: 0.377\n",
            "[5,   355] train_loss: 1.740 train_accuracy: 0.404 test_accuracy: 0.380\n",
            "[5,   360] train_loss: 1.777 train_accuracy: 0.401 test_accuracy: 0.376\n",
            "[5,   365] train_loss: 1.726 train_accuracy: 0.406 test_accuracy: 0.390\n",
            "[5,   370] train_loss: 1.826 train_accuracy: 0.405 test_accuracy: 0.390\n",
            "[5,   375] train_loss: 1.686 train_accuracy: 0.397 test_accuracy: 0.383\n",
            "[5,   380] train_loss: 1.615 train_accuracy: 0.403 test_accuracy: 0.384\n",
            "[5,   385] train_loss: 1.753 train_accuracy: 0.403 test_accuracy: 0.379\n",
            "[5,   390] train_loss: 1.656 train_accuracy: 0.386 test_accuracy: 0.368\n",
            "[5,   395] train_loss: 1.783 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[5,   400] train_loss: 1.816 train_accuracy: 0.397 test_accuracy: 0.383\n",
            "[5,   405] train_loss: 1.579 train_accuracy: 0.396 test_accuracy: 0.386\n",
            "[5,   410] train_loss: 1.651 train_accuracy: 0.402 test_accuracy: 0.385\n",
            "[5,   415] train_loss: 1.828 train_accuracy: 0.394 test_accuracy: 0.384\n",
            "[5,   420] train_loss: 1.698 train_accuracy: 0.401 test_accuracy: 0.386\n",
            "[5,   425] train_loss: 1.770 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,   430] train_loss: 1.863 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[5,   435] train_loss: 1.670 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[5,   440] train_loss: 1.723 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[5,   445] train_loss: 1.802 train_accuracy: 0.403 test_accuracy: 0.379\n",
            "[5,   450] train_loss: 1.665 train_accuracy: 0.404 test_accuracy: 0.377\n",
            "[5,   455] train_loss: 1.699 train_accuracy: 0.409 test_accuracy: 0.383\n",
            "[5,   460] train_loss: 1.756 train_accuracy: 0.414 test_accuracy: 0.387\n",
            "[5,   465] train_loss: 1.649 train_accuracy: 0.413 test_accuracy: 0.385\n",
            "[5,   470] train_loss: 1.661 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[5,   475] train_loss: 1.619 train_accuracy: 0.399 test_accuracy: 0.376\n",
            "[5,   480] train_loss: 1.665 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,   485] train_loss: 1.805 train_accuracy: 0.394 test_accuracy: 0.371\n",
            "[5,   490] train_loss: 1.602 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[5,   495] train_loss: 1.665 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[5,   500] train_loss: 1.664 train_accuracy: 0.394 test_accuracy: 0.377\n",
            "[5,   505] train_loss: 1.783 train_accuracy: 0.413 test_accuracy: 0.389\n",
            "[5,   510] train_loss: 1.831 train_accuracy: 0.411 test_accuracy: 0.385\n",
            "[5,   515] train_loss: 1.720 train_accuracy: 0.420 test_accuracy: 0.393\n",
            "[5,   520] train_loss: 1.718 train_accuracy: 0.414 test_accuracy: 0.386\n",
            "[5,   525] train_loss: 1.840 train_accuracy: 0.409 test_accuracy: 0.384\n",
            "[5,   530] train_loss: 1.760 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[5,   535] train_loss: 1.678 train_accuracy: 0.401 test_accuracy: 0.377\n",
            "[5,   540] train_loss: 1.697 train_accuracy: 0.406 test_accuracy: 0.380\n",
            "[5,   545] train_loss: 1.779 train_accuracy: 0.409 test_accuracy: 0.384\n",
            "[5,   550] train_loss: 1.697 train_accuracy: 0.405 test_accuracy: 0.377\n",
            "[5,   555] train_loss: 1.793 train_accuracy: 0.395 test_accuracy: 0.365\n",
            "[5,   560] train_loss: 1.661 train_accuracy: 0.398 test_accuracy: 0.368\n",
            "[5,   565] train_loss: 1.809 train_accuracy: 0.415 test_accuracy: 0.383\n",
            "[5,   570] train_loss: 1.773 train_accuracy: 0.406 test_accuracy: 0.384\n",
            "[5,   575] train_loss: 1.702 train_accuracy: 0.400 test_accuracy: 0.374\n",
            "[5,   580] train_loss: 1.659 train_accuracy: 0.387 test_accuracy: 0.360\n",
            "[5,   585] train_loss: 1.858 train_accuracy: 0.395 test_accuracy: 0.373\n",
            "[5,   590] train_loss: 1.960 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[5,   595] train_loss: 1.732 train_accuracy: 0.396 test_accuracy: 0.373\n",
            "[5,   600] train_loss: 1.723 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[5,   605] train_loss: 1.794 train_accuracy: 0.400 test_accuracy: 0.385\n",
            "[5,   610] train_loss: 1.722 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   615] train_loss: 1.748 train_accuracy: 0.409 test_accuracy: 0.383\n",
            "[5,   620] train_loss: 1.713 train_accuracy: 0.406 test_accuracy: 0.379\n",
            "[5,   625] train_loss: 1.718 train_accuracy: 0.409 test_accuracy: 0.378\n",
            "[5,   630] train_loss: 1.687 train_accuracy: 0.399 test_accuracy: 0.376\n",
            "[5,   635] train_loss: 1.776 train_accuracy: 0.396 test_accuracy: 0.379\n",
            "[5,   640] train_loss: 1.702 train_accuracy: 0.404 test_accuracy: 0.386\n",
            "[5,   645] train_loss: 1.735 train_accuracy: 0.403 test_accuracy: 0.380\n",
            "[5,   650] train_loss: 1.714 train_accuracy: 0.400 test_accuracy: 0.378\n",
            "[5,   655] train_loss: 1.765 train_accuracy: 0.400 test_accuracy: 0.378\n",
            "[5,   660] train_loss: 1.726 train_accuracy: 0.393 test_accuracy: 0.379\n",
            "[5,   665] train_loss: 1.669 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[5,   670] train_loss: 1.824 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[5,   675] train_loss: 1.720 train_accuracy: 0.407 test_accuracy: 0.379\n",
            "[5,   680] train_loss: 1.806 train_accuracy: 0.413 test_accuracy: 0.381\n",
            "[5,   685] train_loss: 1.792 train_accuracy: 0.418 test_accuracy: 0.389\n",
            "[5,   690] train_loss: 1.693 train_accuracy: 0.413 test_accuracy: 0.390\n",
            "[5,   695] train_loss: 1.651 train_accuracy: 0.412 test_accuracy: 0.390\n",
            "[5,   700] train_loss: 1.685 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[5,   705] train_loss: 1.848 train_accuracy: 0.403 test_accuracy: 0.388\n",
            "[5,   710] train_loss: 1.657 train_accuracy: 0.411 test_accuracy: 0.392\n",
            "[5,   715] train_loss: 1.743 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[5,   720] train_loss: 1.752 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[5,   725] train_loss: 1.747 train_accuracy: 0.412 test_accuracy: 0.391\n",
            "[5,   730] train_loss: 1.608 train_accuracy: 0.409 test_accuracy: 0.386\n",
            "[5,   735] train_loss: 1.687 train_accuracy: 0.397 test_accuracy: 0.379\n",
            "[5,   740] train_loss: 1.796 train_accuracy: 0.401 test_accuracy: 0.389\n",
            "[5,   745] train_loss: 1.677 train_accuracy: 0.405 test_accuracy: 0.390\n",
            "[5,   750] train_loss: 1.655 train_accuracy: 0.385 test_accuracy: 0.376\n",
            "[5,   755] train_loss: 1.710 train_accuracy: 0.402 test_accuracy: 0.385\n",
            "[5,   760] train_loss: 1.691 train_accuracy: 0.395 test_accuracy: 0.378\n",
            "[5,   765] train_loss: 1.738 train_accuracy: 0.390 test_accuracy: 0.366\n",
            "[5,   770] train_loss: 1.865 train_accuracy: 0.398 test_accuracy: 0.373\n",
            "[5,   775] train_loss: 1.732 train_accuracy: 0.405 test_accuracy: 0.380\n",
            "[5,   780] train_loss: 1.722 train_accuracy: 0.399 test_accuracy: 0.379\n",
            "[5,   785] train_loss: 1.739 train_accuracy: 0.403 test_accuracy: 0.385\n",
            "[5,   790] train_loss: 1.730 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[5,   795] train_loss: 1.594 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[5,   800] train_loss: 1.723 train_accuracy: 0.404 test_accuracy: 0.382\n",
            "[5,   805] train_loss: 1.642 train_accuracy: 0.401 test_accuracy: 0.377\n",
            "[5,   810] train_loss: 1.772 train_accuracy: 0.407 test_accuracy: 0.377\n",
            "[5,   815] train_loss: 1.721 train_accuracy: 0.409 test_accuracy: 0.383\n",
            "[5,   820] train_loss: 1.678 train_accuracy: 0.413 test_accuracy: 0.389\n",
            "[5,   825] train_loss: 1.728 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[5,   830] train_loss: 1.721 train_accuracy: 0.411 test_accuracy: 0.385\n",
            "[5,   835] train_loss: 1.777 train_accuracy: 0.407 test_accuracy: 0.380\n",
            "[5,   840] train_loss: 1.772 train_accuracy: 0.403 test_accuracy: 0.378\n",
            "[5,   845] train_loss: 1.770 train_accuracy: 0.395 test_accuracy: 0.382\n",
            "[5,   850] train_loss: 1.821 train_accuracy: 0.413 test_accuracy: 0.396\n",
            "[5,   855] train_loss: 1.827 train_accuracy: 0.409 test_accuracy: 0.388\n",
            "[5,   860] train_loss: 1.670 train_accuracy: 0.405 test_accuracy: 0.381\n",
            "[5,   865] train_loss: 1.793 train_accuracy: 0.402 test_accuracy: 0.373\n",
            "[5,   870] train_loss: 1.895 train_accuracy: 0.383 test_accuracy: 0.352\n",
            "[5,   875] train_loss: 1.798 train_accuracy: 0.399 test_accuracy: 0.378\n",
            "[5,   880] train_loss: 1.755 train_accuracy: 0.409 test_accuracy: 0.387\n",
            "[5,   885] train_loss: 1.692 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[5,   890] train_loss: 1.763 train_accuracy: 0.414 test_accuracy: 0.388\n",
            "[5,   895] train_loss: 1.789 train_accuracy: 0.412 test_accuracy: 0.389\n",
            "[5,   900] train_loss: 1.701 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[5,   905] train_loss: 1.716 train_accuracy: 0.408 test_accuracy: 0.388\n",
            "[5,   910] train_loss: 1.721 train_accuracy: 0.409 test_accuracy: 0.382\n",
            "[5,   915] train_loss: 1.788 train_accuracy: 0.398 test_accuracy: 0.378\n",
            "[5,   920] train_loss: 1.819 train_accuracy: 0.388 test_accuracy: 0.368\n",
            "[5,   925] train_loss: 1.872 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[5,   930] train_loss: 1.765 train_accuracy: 0.403 test_accuracy: 0.384\n",
            "[5,   935] train_loss: 1.675 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[5,   940] train_loss: 1.620 train_accuracy: 0.401 test_accuracy: 0.383\n",
            "[5,   945] train_loss: 1.849 train_accuracy: 0.396 test_accuracy: 0.376\n",
            "[5,   950] train_loss: 1.832 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[5,   955] train_loss: 1.810 train_accuracy: 0.405 test_accuracy: 0.375\n",
            "[5,   960] train_loss: 1.736 train_accuracy: 0.398 test_accuracy: 0.378\n",
            "[5,   965] train_loss: 1.704 train_accuracy: 0.399 test_accuracy: 0.374\n",
            "[5,   970] train_loss: 1.794 train_accuracy: 0.403 test_accuracy: 0.379\n",
            "[5,   975] train_loss: 1.830 train_accuracy: 0.413 test_accuracy: 0.382\n",
            "[5,   980] train_loss: 1.674 train_accuracy: 0.412 test_accuracy: 0.383\n",
            "[5,   985] train_loss: 1.793 train_accuracy: 0.395 test_accuracy: 0.373\n",
            "[5,   990] train_loss: 1.837 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[5,   995] train_loss: 1.820 train_accuracy: 0.413 test_accuracy: 0.390\n",
            "[5,  1000] train_loss: 1.901 train_accuracy: 0.405 test_accuracy: 0.390\n",
            "[5,  1005] train_loss: 1.850 train_accuracy: 0.407 test_accuracy: 0.391\n",
            "[5,  1010] train_loss: 1.742 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[5,  1015] train_loss: 1.788 train_accuracy: 0.400 test_accuracy: 0.383\n",
            "[5,  1020] train_loss: 1.722 train_accuracy: 0.400 test_accuracy: 0.384\n",
            "[5,  1025] train_loss: 1.772 train_accuracy: 0.404 test_accuracy: 0.383\n",
            "[5,  1030] train_loss: 1.714 train_accuracy: 0.400 test_accuracy: 0.378\n",
            "[5,  1035] train_loss: 1.858 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[5,  1040] train_loss: 1.824 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[5,  1045] train_loss: 1.703 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[5,  1050] train_loss: 1.801 train_accuracy: 0.405 test_accuracy: 0.386\n",
            "[5,  1055] train_loss: 1.668 train_accuracy: 0.406 test_accuracy: 0.389\n",
            "[5,  1060] train_loss: 1.729 train_accuracy: 0.407 test_accuracy: 0.384\n",
            "[5,  1065] train_loss: 1.650 train_accuracy: 0.416 test_accuracy: 0.385\n",
            "[5,  1070] train_loss: 1.732 train_accuracy: 0.402 test_accuracy: 0.383\n",
            "[5,  1075] train_loss: 1.692 train_accuracy: 0.393 test_accuracy: 0.381\n",
            "[5,  1080] train_loss: 1.595 train_accuracy: 0.402 test_accuracy: 0.385\n",
            "[5,  1085] train_loss: 1.787 train_accuracy: 0.406 test_accuracy: 0.375\n",
            "[5,  1090] train_loss: 1.695 train_accuracy: 0.422 test_accuracy: 0.387\n",
            "[5,  1095] train_loss: 1.830 train_accuracy: 0.411 test_accuracy: 0.376\n",
            "[5,  1100] train_loss: 1.733 train_accuracy: 0.403 test_accuracy: 0.374\n",
            "[5,  1105] train_loss: 1.757 train_accuracy: 0.412 test_accuracy: 0.385\n",
            "[5,  1110] train_loss: 1.797 train_accuracy: 0.416 test_accuracy: 0.392\n",
            "[5,  1115] train_loss: 1.836 train_accuracy: 0.414 test_accuracy: 0.389\n",
            "[5,  1120] train_loss: 1.804 train_accuracy: 0.408 test_accuracy: 0.385\n",
            "[5,  1125] train_loss: 1.734 train_accuracy: 0.406 test_accuracy: 0.380\n",
            "[5,  1130] train_loss: 1.748 train_accuracy: 0.408 test_accuracy: 0.383\n",
            "[5,  1135] train_loss: 1.740 train_accuracy: 0.416 test_accuracy: 0.391\n",
            "[5,  1140] train_loss: 1.741 train_accuracy: 0.408 test_accuracy: 0.381\n",
            "[5,  1145] train_loss: 1.609 train_accuracy: 0.410 test_accuracy: 0.375\n",
            "[5,  1150] train_loss: 1.896 train_accuracy: 0.402 test_accuracy: 0.373\n",
            "[5,  1155] train_loss: 1.671 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[5,  1160] train_loss: 1.733 train_accuracy: 0.395 test_accuracy: 0.373\n",
            "[5,  1165] train_loss: 1.664 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[5,  1170] train_loss: 1.691 train_accuracy: 0.410 test_accuracy: 0.395\n",
            "[5,  1175] train_loss: 1.815 train_accuracy: 0.419 test_accuracy: 0.391\n",
            "[5,  1180] train_loss: 1.699 train_accuracy: 0.413 test_accuracy: 0.383\n",
            "[5,  1185] train_loss: 1.854 train_accuracy: 0.411 test_accuracy: 0.379\n",
            "[5,  1190] train_loss: 1.678 train_accuracy: 0.415 test_accuracy: 0.384\n",
            "[5,  1195] train_loss: 1.757 train_accuracy: 0.410 test_accuracy: 0.380\n",
            "[5,  1200] train_loss: 1.764 train_accuracy: 0.408 test_accuracy: 0.378\n",
            "[5,  1205] train_loss: 1.838 train_accuracy: 0.411 test_accuracy: 0.385\n",
            "[5,  1210] train_loss: 1.797 train_accuracy: 0.398 test_accuracy: 0.373\n",
            "[5,  1215] train_loss: 1.707 train_accuracy: 0.410 test_accuracy: 0.384\n",
            "[5,  1220] train_loss: 1.741 train_accuracy: 0.401 test_accuracy: 0.378\n",
            "[5,  1225] train_loss: 1.671 train_accuracy: 0.405 test_accuracy: 0.382\n",
            "[5,  1230] train_loss: 1.687 train_accuracy: 0.405 test_accuracy: 0.382\n",
            "[5,  1235] train_loss: 1.720 train_accuracy: 0.398 test_accuracy: 0.379\n",
            "[5,  1240] train_loss: 1.757 train_accuracy: 0.406 test_accuracy: 0.387\n",
            "[5,  1245] train_loss: 1.721 train_accuracy: 0.412 test_accuracy: 0.387\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "# Writing training accuracy to file\n",
        "with open('Accuracy_a_train.txt', 'w') as file:\n",
        "    for i in range(len(a_train)):\n",
        "        file.write(str(a_train[i]))\n",
        "        if i < len(a_train) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing test accuracy to file\n",
        "with open('Accuracy_a_test.txt', 'w') as file:\n",
        "    for i in range(len(a_test)):\n",
        "        file.write(str(a_test[i]))\n",
        "        if i < len(a_test) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing loss values to file\n",
        "with open('Accuracy_loss.txt', 'w') as file:\n",
        "    for i in range(len(lossaaa)):\n",
        "        file.write(str(lossaaa[i]))\n",
        "        if i < len(lossaaa) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "FxwonJ737mdO"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Convert tensors to lists\n",
        "Inf_list = [tensor.item() for tensor in Inf]\n",
        "Var_av_list = [tensor.item() for tensor in Var_all]\n",
        "Generalization_Ratio_list = [tensor.item() for tensor in Generalization_Ratio_]\n",
        "\n",
        "# Writing Inf_list to file\n",
        "with open('Inf_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Inf_list)):\n",
        "        file.write(str(Inf_list[i]))\n",
        "        if i < len(Inf_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Var_av_list to file\n",
        "with open('Var_all_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Var_av_list)):\n",
        "        file.write(str(Var_av_list[i]))\n",
        "        if i < len(Var_av_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Generalization_Ratio_list to file\n",
        "with open('Generalization_Ratio_list.txt', 'w') as file:\n",
        "    for i in range(len(Generalization_Ratio_list)):\n",
        "        file.write(str(Generalization_Ratio_list[i]))\n",
        "        if i < len(Generalization_Ratio_list) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "AcrFOpRT7r4O"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import time\n",
        "import os  # Import the os module\n",
        "\n",
        "os.makedirs(os.path.join('./Models/'), exist_ok=True)  # Create the directory './Models/' if it doesn't exist\n",
        "model_path = './Models/'  # Define the model path\n",
        "\n",
        "rq = time.strftime('%Y%m%d%H%M', time.localtime(time.time()))  # Get the current time in the format 'YYYYMMDDHHMM'\n",
        "\n",
        "# Save the training results\n",
        "current_model_path = model_path + rq + \"_model.pkl\"  # Create the full path for the model file with the current timestamp\n",
        "torch.save(net, current_model_path)  # Save the model to the specified path\n",
        "print(\"Saved model file: \" + current_model_path)  # Print the path of the saved model file"
      ],
      "metadata": {
        "id": "47QTTvnd7y5V"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Display the highest value that appears during training\n",
        "print(\"train:\", max(a_train))  # Print the highest value in the training data\n",
        "print(\"test:\", max(a_test))  # Print the highest value in the test data\n",
        "print(\"loss:\", min(lossaaa))  # Print the minimum value of the loss"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "WHm_PQlw72lV",
        "outputId": "6ab7a3d9-1b65-48da-d67c-db8af8b0d8e8"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "train: 0.4225\n",
            "test: 0.3958\n",
            "loss: 1.5249487638473511\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "trainset = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "testset = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 test dataset\n",
        "trainloader = torch.utils.data.DataLoader(trainset, batch_size=50000, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "t_loader = torch.utils.data.DataLoader(testset, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "trainloader_iter = iter(trainloader)  # Create an iterator for the training DataLoader\n",
        "tl_image, tl_label = next(trainloader_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "tl_image = tl_image.cuda()  # Move training images to GPU\n",
        "tl_label = tl_label.cuda()  # Move training labels to GPU\n",
        "tl_imageoutputs = net(tl_image)  # [batch, 10]  # Get the outputs from the network for the training images\n",
        "predict_y = torch.max(tl_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy = torch.eq(predict_y, tl_label).sum().item() / tl_label.size(0)  # Calculate accuracy for the training set\n",
        "print(\"train:\", float(accuracy))  # Print the training accuracy\n",
        "\n",
        "t_data_iter = iter(t_loader)  # Create an iterator for the test DataLoader\n",
        "t_image, t_label = next(t_data_iter)  # Get the next batch of images and labels from the test DataLoader\n",
        "t_image = t_image.cuda()  # Move test images to GPU\n",
        "t_label = t_label.cuda()  # Move test labels to GPU\n",
        "t_imageoutputs = net(t_image)  # [batch, 10]  # Get the outputs from the network for the test images\n",
        "predict = torch.max(t_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy_t = torch.eq(predict, t_label).sum().item() / t_label.size(0)  # Calculate accuracy for the test set\n",
        "print(\"test:\", float(accuracy_t))  # Print the test accuracy"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "q8zaFqdG742C",
        "outputId": "bbfd3ba4-efdf-4f83-ae3e-a603a5aa86b0"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "train: 0.40658\n",
            "test: 0.3874\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### **Network1 : use only linear layers (not use GDP)**"
      ],
      "metadata": {
        "id": "auHqb2pK7eIi"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import argparse\n",
        "import os\n",
        "import numpy as np\n",
        "import torchvision.transforms as transforms\n",
        "from torchvision.utils import save_image\n",
        "from torch.utils.data import DataLoader\n",
        "from torchvision import datasets\n",
        "from torch.autograd import Variable\n",
        "import torch.nn as nn\n",
        "import torch\n",
        "\n",
        "class LLNet(nn.Module):  # Use only linear layers\n",
        "    def __init__(self):\n",
        "        super(LLNet, self).__init__()\n",
        "\n",
        "        self.fc1 = nn.Linear(3*32*32, 1000)  # First fully connected layer\n",
        "        self.fc2 = nn.Linear(1000, 500)      # Second fully connected layer\n",
        "        self.fc3 = nn.Linear(500, 100)       # Third fully connected layer\n",
        "        self.fc4 = nn.Linear(100, 50)        # Fourth fully connected layer\n",
        "        self.fc5 = nn.Linear(50, 25)         # Fifth fully connected layer\n",
        "        self.fc6 = nn.Linear(25, 20)         # Sixth fully connected layer\n",
        "        self.fc7 = nn.Linear(20, 10)         # Seventh fully connected layer (output layer)\n",
        "\n",
        "    def forward(self, x):\n",
        "        x = x.view(-1, 3*32*32)  # Flatten the input image\n",
        "        x = self.fc1(x)  # Apply first fully connected layer\n",
        "        x = self.fc2(x)  # Apply second fully connected layer\n",
        "        x = self.fc3(x)  # Apply third fully connected layer\n",
        "        x = self.fc4(x)  # Apply fourth fully connected layer\n",
        "        x = self.fc5(x)  # Apply fifth fully connected layer\n",
        "        x = self.fc6(x)  # Apply sixth fully connected layer\n",
        "        x = self.fc7(x)  # Apply seventh fully connected layer (output)\n",
        "        return x\n",
        "\n",
        "loss_function = torch.nn.CrossEntropyLoss()  # Define the loss function\n",
        "net = LLNet()  # Instantiate the network\n",
        "\n",
        "# If a GPU is available, run everything in CUDA mode\n",
        "if torch.cuda.is_available():\n",
        "    net = net.cuda()  # Move the network to GPU\n",
        "    loss_function = loss_function.cuda()  # Move the loss function to GPU\n",
        "\n",
        "optimizer_L = torch.optim.Adam(net.parameters(), lr=0.001)  # Define the optimizer with a learning rate of 0.001"
      ],
      "metadata": {
        "id": "Odj8TkCeY5sz"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import numpy as np\n",
        "import torch\n",
        "import torchvision\n",
        "import torch.nn as nn\n",
        "from matplotlib import pyplot as plt\n",
        "import random\n",
        "import torch.optim as optim\n",
        "import torchvision.transforms as transforms\n",
        "import time\n",
        "import torch.nn.functional as F\n",
        "from collections import Counter, defaultdict\n",
        "from itertools import combinations\n",
        "\n",
        "################################################ reload\n",
        "transform = transforms.Compose(\n",
        "    [transforms.ToTensor(),\n",
        "     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])  # Define the transformation to be applied to the images\n",
        "\n",
        "train_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "test_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)  # Load CIFAR-10 test dataset\n",
        "\n",
        "train_loader = torch.utils.data.DataLoader(train_set, batch_size=40, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "testloader = torch.utils.data.DataLoader(test_set, batch_size=40, shuffle=True, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "val_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 validation dataset\n",
        "val_loader = torch.utils.data.DataLoader(val_set, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for validation set\n",
        "val_data_iter = iter(val_loader)  # Create an iterator for the validation DataLoader\n",
        "val_image, val_label = next(val_data_iter)  # Get the next batch of images and labels from the validation DataLoader\n",
        "#print(val_image.shape)  # Print the shape of validation images\n",
        "\n",
        "##################\n",
        "tra_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=False, transform=transform)  # Load CIFAR-10 training dataset again\n",
        "tra_loader = torch.utils.data.DataLoader(tra_set, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for the training set\n",
        "tra_data_iter = iter(tra_loader)  # Create an iterator for the training DataLoader\n",
        "tra_image, tra_label = next(tra_data_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "\n",
        "##################\n",
        "classes = ('plane', 'car', 'bird', 'cat',  # Define the class labels\n",
        "           'deer', 'dog', 'frog', 'horse', 'ship', 'truck')\n",
        "\n",
        "optimizer = optim.Adam(net.parameters(), lr=0.001)  # Initialize the Adam optimizer with learning rate 0.001\n",
        "\n",
        "########################################################\n",
        "\n",
        "a_train = []  # To store training accuracy\n",
        "a_test = []  # To store test accuracy\n",
        "lossaaa = []  # To store loss values\n",
        "Inf = []  # To store information values\n",
        "Var_all = []  # To store all variation values\n",
        "Generalization_Ratio_ = []  # To store generalization ratios\n",
        "dicide_action = []  # To store decision actions\n",
        "loss_before = torch.tensor(30.0)  # Initial loss value\n",
        "los = torch.tensor(30.0)  # Initial loss value\n",
        "dis_before_A1 = torch.tensor(0)  # Distance before action A1\n",
        "dis_before_A2 = torch.tensor(0)  # Distance before action A2\n",
        "dis = torch.tensor(1)  # Distance increment\n",
        "per = \"N\"  # Previous iteration's action\n",
        "state_before = torch.tensor(0.0)  # Previous state value\n",
        "categrary_number = 10  # Number of categories\n",
        "tra_val_number = 2  # Training validation number\n",
        "\n",
        "for epoch in range(5):  # Loop over the dataset multiple times\n",
        "    e3412_iter = iter(e3412_loader)  # Iterator for e3412_loader\n",
        "    running_loss = 0.0  # Running loss\n",
        "    running_loss_all = 0.0  # Running loss for all\n",
        "    loss_before = Variable(loss_before, requires_grad=False)  # Make loss_before a variable\n",
        "    los = Variable(los, requires_grad=False)  # Make los a variable\n",
        "    state_before = Variable(state_before, requires_grad=False)  # Make state_before a variable\n",
        "    dis_before_A1 = Variable(dis_before_A1, requires_grad=False)  # Make dis_before_A1 a variable\n",
        "    dis_before_A2 = Variable(dis_before_A2, requires_grad=False)  # Make dis_before_A2 a variable\n",
        "    acc_A1 = Variable(dis_before_A1, requires_grad=False)  # Make acc_A1 a variable\n",
        "    acc_A2 = Variable(dis_before_A2, requires_grad=False)  # Make acc_A2 a variable\n",
        "    dis_ = Variable(dis, requires_grad=False)  # Make dis a variable\n",
        "\n",
        "    for step, (imgs, labels) in enumerate(e1234_loader):  # Iterate over the data\n",
        "        ### calculate losses\n",
        "        weight_val_probility = 1.0 / tra_val_number  # Weight for validation probability\n",
        "        labels = labels.cuda()  # Move labels to GPU\n",
        "        imgs = imgs.cuda()  # Move images to GPU\n",
        "        out_e1234 = net(imgs)  # Get output from the network\n",
        "        loss_out_e1234 = loss_function(out_e1234, labels)  # Calculate loss for e1234 (A1)\n",
        "\n",
        "        e3412_imgs, e3412_labels = next(e3412_iter)  # Get next batch from e3412_iter\n",
        "        e3412_imgs = e3412_imgs.cuda()  # Move e3412 images to GPU\n",
        "        e3412_labels = e3412_labels.cuda()  # Move e3412 labels to GPU\n",
        "        out_e3412 = net(e3412_imgs)  # Get output from the network\n",
        "        loss_out_e3412 = loss_function(out_e3412, e3412_labels)  # Calculate loss for e3412 (A3)\n",
        "\n",
        "        #################### extract\n",
        "        ## e1 ext count\n",
        "        e12_extracted_loader_image = e12_extracted_loader_image.cuda()  # Move e12 extracted images to GPU\n",
        "        e12_extracted_loader_label = e12_extracted_loader_label.cuda()  # Move e12 extracted labels to GPU\n",
        "        e12_extracted_out = net(e12_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e12_extracted = torch.max(e12_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ## e2 ext count\n",
        "        e34_extracted_loader_image = e34_extracted_loader_image.cuda()  # Move e34 extracted images to GPU\n",
        "        e34_extracted_loader_label = e34_extracted_loader_label.cuda()  # Move e34 extracted labels to GPU\n",
        "        e34_extracted_out = net(e34_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e34_extracted = torch.max(e34_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ########### e1 count\n",
        "        e12_s_loader_image = e12_s_loader_image.cuda()  # Move e12 sample images to GPU\n",
        "        e12_s_loader_label = e12_s_loader_label.cuda()  # Move e12 sample labels to GPU\n",
        "        e12_inform_out = net(e12_s_loader_image).detach()  # Get detached output from the network\n",
        "        e12_inform = torch.max(e12_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e12_inform = torch.chunk(e12_inform, 10)  # Split e12 inform into 10 chunks\n",
        "        split_e12_inform = list(split_e12_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e12_inform)):\n",
        "            counts_E12 = torch.bincount(split_e12_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e12 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e12[category] = counts_E12[category]  # Update counts\n",
        "            split_e12_inform[i] = counts_e12  # Store updated counts\n",
        "\n",
        "        ########### e2 count\n",
        "        e34_s_loader_image = e34_s_loader_image.cuda()  # Move e34 sample images to GPU\n",
        "        e34_s_loader_label = e34_s_loader_label.cuda()  # Move e34 sample labels to GPU\n",
        "        e34_inform_out = net(e34_s_loader_image).detach()  # Get detached output from the network\n",
        "        e34_inform = torch.max(e34_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e34_inform = torch.chunk(e34_inform, 10)  # Split e34 inform into 10 chunks\n",
        "        split_e34_inform = list(split_e34_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e34_inform)):\n",
        "            counts_E34 = torch.bincount(split_e34_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e34 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e34[category] = counts_E34[category]  # Update counts\n",
        "            split_e34_inform[i] = counts_e34  # Store updated counts\n",
        "\n",
        "        ##########\n",
        "        ## IN_IN_pro\n",
        "        counts_i_12 = torch.bincount(e12_inform, minlength=10)  # Count occurrences for e12 inform\n",
        "        counts_i_34 = torch.bincount(e34_inform, minlength=10)  # Count occurrences for e34 inform\n",
        "        counts_in_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_in_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_12[category] = counts_i_12[category]  # Update counts for e12\n",
        "        total_samples_in_12 = len(e12_inform)  # Total samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_34[category] = counts_i_34[category]  # Update counts for e34\n",
        "        total_samples_in_34 = len(e34_inform)  # Total samples in e34\n",
        "\n",
        "        min_denominator_in_12 = total_samples_in_12 * 1e-6  # Minimum denominator for e12\n",
        "        probabilities_in_12 = counts_in_12 / (total_samples_in_12 + min_denominator_in_12)  # Probabilities for e12\n",
        "        probabilities_tensor_in_12 = probabilities_in_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12\n",
        "\n",
        "        min_denominator_in_34 = total_samples_in_34 * 1e-6  # Minimum denominator for e34\n",
        "        probabilities_in_34 = counts_in_34 / (total_samples_in_34 + min_denominator_in_34)  # Probabilities for e34\n",
        "        probabilities_tensor_in_34 = probabilities_in_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34\n",
        "\n",
        "        counts_ext_12 = torch.bincount(e12_extracted, minlength=10)  # Count occurrences for e12 extracted\n",
        "        counts_ext_34 = torch.bincount(e34_extracted, minlength=10)  # Count occurrences for e34 extracted\n",
        "        counts_extra_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_extra_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_12[category] = counts_ext_12[category]  # Update counts for e12 extracted\n",
        "        total_extracted_in_12 = len(e12_extracted)  # Total extracted samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_34[category] = counts_ext_34[category]  # Update counts for e34 extracted\n",
        "        total_extracted_in_34 = len(e34_extracted)  # Total extracted samples in e34\n",
        "\n",
        "        min_denominator_ext_12 = total_extracted_in_12 * 1e-6  # Minimum denominator for e12 extracted\n",
        "        probabilities_ext_12 = counts_extra_12 / (total_extracted_in_12 + min_denominator_ext_12)  # Probabilities for e12 extracted\n",
        "        probabilities_tensor_extra_12 = probabilities_ext_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12 extracted\n",
        "\n",
        "        min_denominator_ext_34 = total_extracted_in_34 * 1e-6  # Minimum denominator for e34 extracted\n",
        "        probabilities_ext_34 = counts_extra_34 / (total_extracted_in_34 + min_denominator_ext_34)  # Probabilities for e34 extracted\n",
        "        probabilities_tensor_extra_34 = probabilities_ext_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34 extracted\n",
        "\n",
        "        ############################### Variation x ###################################\n",
        "        in_12_all = probabilities_tensor_in_12\n",
        "        in_34_all = probabilities_tensor_in_34\n",
        "        in_12_extra = probabilities_tensor_extra_12\n",
        "        in_34_extra = probabilities_tensor_extra_34\n",
        "        weight_tra_probility_all = 1.0 / 2\n",
        "        dow_all = \\\n",
        "              (in_12_all*weight_tra_probility_all + in_34_all*weight_tra_probility_all +\n",
        "              in_12_extra*weight_tra_probility_all + in_34_extra*weight_tra_probility_all + 1e-30)\n",
        "        in_1_all = (in_12_all*weight_tra_probility_all) / dow_all\n",
        "        in_2_all = (in_34_all*weight_tra_probility_all) / dow_all\n",
        "        e_1_all = (in_12_extra*weight_tra_probility_all) / dow_all\n",
        "        e_2_all = (in_34_extra*weight_tra_probility_all) / dow_all\n",
        "        in_1_all = in_1_all[0]\n",
        "        in_2_all = in_2_all[0]\n",
        "        e_1_all = e_1_all[0]\n",
        "        e_2_all = e_2_all[0]\n",
        "        d_KL_all = torch.zeros(10)\n",
        "        k_divergence_all = (in_1_all + 1e-30) * torch.log(in_1_all / (e_1_all + 1e-30) + 1e-30)\n",
        "        k_divergence_all_ = (in_1_all + 1e-30) * torch.log(in_1_all / (e_2_all + 1e-30) + 1e-30)\n",
        "        d_KL_all = torch.max(abs(k_divergence_all))\n",
        "        d_KL_all_ = torch.max(abs(k_divergence_all_))\n",
        "        Variation_all = torch.max(d_KL_all, d_KL_all_)\n",
        "        Var_all.append(Variation_all)\n",
        "\n",
        "        ############################ Information ###################################\n",
        "        all_combinations = list(combinations(range(10), 2))\n",
        "        K = categrary_number * (categrary_number - 1)\n",
        "        result_tensor = torch.zeros(len(all_combinations) * 2)  # Calculate the difference of each pair of combinations and store in result tensor\n",
        "        for c in range(10):\n",
        "            for idx, (i, j) in enumerate(all_combinations):\n",
        "                s1 = abs(((split_e12_inform[c][i]/10) + 1e-30) * torch.log((split_e12_inform[c][i]/10) / ((split_e12_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                s3 = abs(((split_e34_inform[c][i]/10) + 1e-30) * torch.log((split_e34_inform[c][i]/10) / ((split_e34_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                min_value = torch.min(s1, s3)\n",
        "                result_tensor[idx] = min_value.item()\n",
        "                idx_ = idx + len(all_combinations)\n",
        "                s1_ = abs(((split_e12_inform[c][j]/10) + 1e-30) * torch.log((split_e12_inform[c][j]/10) / ((split_e12_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                s3_ = abs(((split_e34_inform[c][j]/10) + 1e-30) * torch.log((split_e34_inform[c][j]/10) / ((split_e34_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                min_value_ = torch.min(s1_, s3_)\n",
        "                result_tensor[idx_] = min_value_.item()\n",
        "        Information = torch.sum(result_tensor) / K\n",
        "        Inf.append(Information)\n",
        "\n",
        "        ############################ Generalization_Ratio ###################################\n",
        "        Generalization_Ratio = Variation_all * (Information + 1.0) / Information\n",
        "        Generalization_Ratio_.append(Generalization_Ratio)\n",
        "\n",
        "        ############################ Generalization Decision Process (GDP) ###################################\n",
        "        state_now = Generalization_Ratio\n",
        "        loss_before = loss_before.cuda()\n",
        "        state_before = state_before.cuda()\n",
        "        state_dis = state_now - state_before\n",
        "        result_tensor = torch.cat((loss_out_e1234.unsqueeze(0), loss_out_e3412.unsqueeze(0)), 0)\n",
        "\n",
        "        # Because two datasets loss_out_e1234 and loss_out_e3412 are used, and there are actions A1 and A2,\n",
        "        # choose one based on the reward\n",
        "        if state_dis >= 0.0:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "        else:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "\n",
        "        ####################################\n",
        "        #### optimizer\n",
        "        los = loss - loss_before\n",
        "        ####################################\n",
        "        loss = loss_out_e1234  # Losses from not using the selection\n",
        "        ####################################\n",
        "        state_before = state_now\n",
        "        optimizer_L.zero_grad()\n",
        "        loss.backward()\n",
        "        optimizer_L.step()\n",
        "        loss_before = loss\n",
        "        running_loss += loss.item()\n",
        "\n",
        "        # Print statistics\n",
        "        if step % 5 == 4:  # Print every 500 mini-batches\n",
        "            with torch.no_grad():  # 'with' is a context manager\n",
        "                s_test_image = s_test_image.cuda()\n",
        "                s_test_label = s_test_label.cuda()\n",
        "                s_tra_image = s_tra_image.cuda()\n",
        "                s_tra_label = s_tra_label.cuda()\n",
        "                outputs = net(s_test_image)  # [batch, 10]\n",
        "                predict_y = torch.max(outputs, dim=1)[1]\n",
        "                accuracy = torch.eq(predict_y, s_test_label).sum().item() / s_test_label.size(0)\n",
        "                a_test.append(float(accuracy))\n",
        "                outputs_t = net(s_tra_image)  # [batch, 10]\n",
        "                predict_y_t = torch.max(outputs_t, dim=1)[1]\n",
        "                accuracy_t = torch.eq(predict_y_t, s_tra_label).sum().item() / s_tra_label.size(0)\n",
        "                a_train.append(float(accuracy_t))\n",
        "                lossaaa.append(float(running_loss / 5))\n",
        "                print('[%d, %5d] train_loss: %.3f train_accuracy: %.3f test_accuracy: %.3f' %\n",
        "                      (epoch + 1, step + 1, running_loss / 5, accuracy_t, accuracy))\n",
        "                running_loss = 0.0\n",
        "                running_loss = 0.0"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "oiQq_PO07dXB",
        "outputId": "53d04971-d268-4ce6-ee2c-dad5a85913b6"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "Files already downloaded and verified\n",
            "[1,     5] train_loss: 2.300 train_accuracy: 0.204 test_accuracy: 0.197\n",
            "[1,    10] train_loss: 2.114 train_accuracy: 0.254 test_accuracy: 0.250\n",
            "[1,    15] train_loss: 2.209 train_accuracy: 0.208 test_accuracy: 0.212\n",
            "[1,    20] train_loss: 2.156 train_accuracy: 0.197 test_accuracy: 0.204\n",
            "[1,    25] train_loss: 2.146 train_accuracy: 0.243 test_accuracy: 0.242\n",
            "[1,    30] train_loss: 2.082 train_accuracy: 0.253 test_accuracy: 0.247\n",
            "[1,    35] train_loss: 2.015 train_accuracy: 0.237 test_accuracy: 0.237\n",
            "[1,    40] train_loss: 2.111 train_accuracy: 0.262 test_accuracy: 0.268\n",
            "[1,    45] train_loss: 2.055 train_accuracy: 0.257 test_accuracy: 0.253\n",
            "[1,    50] train_loss: 2.011 train_accuracy: 0.250 test_accuracy: 0.243\n",
            "[1,    55] train_loss: 2.073 train_accuracy: 0.230 test_accuracy: 0.228\n",
            "[1,    60] train_loss: 2.007 train_accuracy: 0.270 test_accuracy: 0.267\n",
            "[1,    65] train_loss: 2.008 train_accuracy: 0.274 test_accuracy: 0.269\n",
            "[1,    70] train_loss: 2.040 train_accuracy: 0.284 test_accuracy: 0.282\n",
            "[1,    75] train_loss: 2.031 train_accuracy: 0.288 test_accuracy: 0.291\n",
            "[1,    80] train_loss: 1.962 train_accuracy: 0.280 test_accuracy: 0.278\n",
            "[1,    85] train_loss: 1.975 train_accuracy: 0.280 test_accuracy: 0.276\n",
            "[1,    90] train_loss: 2.002 train_accuracy: 0.289 test_accuracy: 0.286\n",
            "[1,    95] train_loss: 2.021 train_accuracy: 0.293 test_accuracy: 0.295\n",
            "[1,   100] train_loss: 2.011 train_accuracy: 0.292 test_accuracy: 0.293\n",
            "[1,   105] train_loss: 2.006 train_accuracy: 0.308 test_accuracy: 0.312\n",
            "[1,   110] train_loss: 1.941 train_accuracy: 0.292 test_accuracy: 0.298\n",
            "[1,   115] train_loss: 2.020 train_accuracy: 0.297 test_accuracy: 0.296\n",
            "[1,   120] train_loss: 1.896 train_accuracy: 0.296 test_accuracy: 0.298\n",
            "[1,   125] train_loss: 1.924 train_accuracy: 0.300 test_accuracy: 0.305\n",
            "[1,   130] train_loss: 2.022 train_accuracy: 0.302 test_accuracy: 0.305\n",
            "[1,   135] train_loss: 1.969 train_accuracy: 0.272 test_accuracy: 0.276\n",
            "[1,   140] train_loss: 1.971 train_accuracy: 0.286 test_accuracy: 0.285\n",
            "[1,   145] train_loss: 1.910 train_accuracy: 0.308 test_accuracy: 0.303\n",
            "[1,   150] train_loss: 1.885 train_accuracy: 0.319 test_accuracy: 0.309\n",
            "[1,   155] train_loss: 1.982 train_accuracy: 0.302 test_accuracy: 0.304\n",
            "[1,   160] train_loss: 1.948 train_accuracy: 0.311 test_accuracy: 0.303\n",
            "[1,   165] train_loss: 1.886 train_accuracy: 0.307 test_accuracy: 0.306\n",
            "[1,   170] train_loss: 2.008 train_accuracy: 0.288 test_accuracy: 0.297\n",
            "[1,   175] train_loss: 1.988 train_accuracy: 0.285 test_accuracy: 0.285\n",
            "[1,   180] train_loss: 2.067 train_accuracy: 0.274 test_accuracy: 0.276\n",
            "[1,   185] train_loss: 1.927 train_accuracy: 0.317 test_accuracy: 0.311\n",
            "[1,   190] train_loss: 1.880 train_accuracy: 0.328 test_accuracy: 0.327\n",
            "[1,   195] train_loss: 2.003 train_accuracy: 0.289 test_accuracy: 0.288\n",
            "[1,   200] train_loss: 1.902 train_accuracy: 0.309 test_accuracy: 0.303\n",
            "[1,   205] train_loss: 2.033 train_accuracy: 0.319 test_accuracy: 0.313\n",
            "[1,   210] train_loss: 1.942 train_accuracy: 0.325 test_accuracy: 0.320\n",
            "[1,   215] train_loss: 1.901 train_accuracy: 0.309 test_accuracy: 0.309\n",
            "[1,   220] train_loss: 1.933 train_accuracy: 0.313 test_accuracy: 0.315\n",
            "[1,   225] train_loss: 2.031 train_accuracy: 0.322 test_accuracy: 0.316\n",
            "[1,   230] train_loss: 1.920 train_accuracy: 0.327 test_accuracy: 0.328\n",
            "[1,   235] train_loss: 1.807 train_accuracy: 0.299 test_accuracy: 0.300\n",
            "[1,   240] train_loss: 1.849 train_accuracy: 0.320 test_accuracy: 0.317\n",
            "[1,   245] train_loss: 1.923 train_accuracy: 0.324 test_accuracy: 0.323\n",
            "[1,   250] train_loss: 2.004 train_accuracy: 0.306 test_accuracy: 0.312\n",
            "[1,   255] train_loss: 1.927 train_accuracy: 0.311 test_accuracy: 0.310\n",
            "[1,   260] train_loss: 2.038 train_accuracy: 0.325 test_accuracy: 0.318\n",
            "[1,   265] train_loss: 1.977 train_accuracy: 0.313 test_accuracy: 0.305\n",
            "[1,   270] train_loss: 1.910 train_accuracy: 0.299 test_accuracy: 0.285\n",
            "[1,   275] train_loss: 1.865 train_accuracy: 0.337 test_accuracy: 0.324\n",
            "[1,   280] train_loss: 1.987 train_accuracy: 0.307 test_accuracy: 0.304\n",
            "[1,   285] train_loss: 1.945 train_accuracy: 0.296 test_accuracy: 0.294\n",
            "[1,   290] train_loss: 2.061 train_accuracy: 0.335 test_accuracy: 0.330\n",
            "[1,   295] train_loss: 1.984 train_accuracy: 0.327 test_accuracy: 0.329\n",
            "[1,   300] train_loss: 1.906 train_accuracy: 0.332 test_accuracy: 0.331\n",
            "[1,   305] train_loss: 1.885 train_accuracy: 0.331 test_accuracy: 0.329\n",
            "[1,   310] train_loss: 1.883 train_accuracy: 0.314 test_accuracy: 0.312\n",
            "[1,   315] train_loss: 1.958 train_accuracy: 0.327 test_accuracy: 0.325\n",
            "[1,   320] train_loss: 1.977 train_accuracy: 0.327 test_accuracy: 0.323\n",
            "[1,   325] train_loss: 1.963 train_accuracy: 0.310 test_accuracy: 0.310\n",
            "[1,   330] train_loss: 1.975 train_accuracy: 0.298 test_accuracy: 0.297\n",
            "[1,   335] train_loss: 1.960 train_accuracy: 0.328 test_accuracy: 0.321\n",
            "[1,   340] train_loss: 1.923 train_accuracy: 0.327 test_accuracy: 0.324\n",
            "[1,   345] train_loss: 1.862 train_accuracy: 0.332 test_accuracy: 0.329\n",
            "[1,   350] train_loss: 1.874 train_accuracy: 0.332 test_accuracy: 0.326\n",
            "[1,   355] train_loss: 1.893 train_accuracy: 0.331 test_accuracy: 0.327\n",
            "[1,   360] train_loss: 1.868 train_accuracy: 0.343 test_accuracy: 0.341\n",
            "[1,   365] train_loss: 1.878 train_accuracy: 0.326 test_accuracy: 0.323\n",
            "[1,   370] train_loss: 1.792 train_accuracy: 0.314 test_accuracy: 0.312\n",
            "[1,   375] train_loss: 1.942 train_accuracy: 0.318 test_accuracy: 0.321\n",
            "[1,   380] train_loss: 1.938 train_accuracy: 0.327 test_accuracy: 0.320\n",
            "[1,   385] train_loss: 1.794 train_accuracy: 0.330 test_accuracy: 0.325\n",
            "[1,   390] train_loss: 1.932 train_accuracy: 0.336 test_accuracy: 0.334\n",
            "[1,   395] train_loss: 1.898 train_accuracy: 0.326 test_accuracy: 0.325\n",
            "[1,   400] train_loss: 1.861 train_accuracy: 0.326 test_accuracy: 0.321\n",
            "[1,   405] train_loss: 1.789 train_accuracy: 0.321 test_accuracy: 0.311\n",
            "[1,   410] train_loss: 1.976 train_accuracy: 0.321 test_accuracy: 0.307\n",
            "[1,   415] train_loss: 1.849 train_accuracy: 0.318 test_accuracy: 0.314\n",
            "[1,   420] train_loss: 1.880 train_accuracy: 0.334 test_accuracy: 0.332\n",
            "[1,   425] train_loss: 1.761 train_accuracy: 0.333 test_accuracy: 0.327\n",
            "[1,   430] train_loss: 1.839 train_accuracy: 0.317 test_accuracy: 0.313\n",
            "[1,   435] train_loss: 1.988 train_accuracy: 0.338 test_accuracy: 0.327\n",
            "[1,   440] train_loss: 1.978 train_accuracy: 0.337 test_accuracy: 0.330\n",
            "[1,   445] train_loss: 1.857 train_accuracy: 0.336 test_accuracy: 0.325\n",
            "[1,   450] train_loss: 1.819 train_accuracy: 0.352 test_accuracy: 0.345\n",
            "[1,   455] train_loss: 1.697 train_accuracy: 0.344 test_accuracy: 0.341\n",
            "[1,   460] train_loss: 1.970 train_accuracy: 0.336 test_accuracy: 0.335\n",
            "[1,   465] train_loss: 1.954 train_accuracy: 0.312 test_accuracy: 0.304\n",
            "[1,   470] train_loss: 1.818 train_accuracy: 0.321 test_accuracy: 0.313\n",
            "[1,   475] train_loss: 1.880 train_accuracy: 0.334 test_accuracy: 0.331\n",
            "[1,   480] train_loss: 1.929 train_accuracy: 0.343 test_accuracy: 0.338\n",
            "[1,   485] train_loss: 1.910 train_accuracy: 0.315 test_accuracy: 0.313\n",
            "[1,   490] train_loss: 1.865 train_accuracy: 0.332 test_accuracy: 0.333\n",
            "[1,   495] train_loss: 1.705 train_accuracy: 0.354 test_accuracy: 0.348\n",
            "[1,   500] train_loss: 1.732 train_accuracy: 0.343 test_accuracy: 0.331\n",
            "[1,   505] train_loss: 1.766 train_accuracy: 0.336 test_accuracy: 0.328\n",
            "[1,   510] train_loss: 1.886 train_accuracy: 0.327 test_accuracy: 0.333\n",
            "[1,   515] train_loss: 1.801 train_accuracy: 0.312 test_accuracy: 0.318\n",
            "[1,   520] train_loss: 1.911 train_accuracy: 0.350 test_accuracy: 0.348\n",
            "[1,   525] train_loss: 1.825 train_accuracy: 0.339 test_accuracy: 0.335\n",
            "[1,   530] train_loss: 1.946 train_accuracy: 0.339 test_accuracy: 0.332\n",
            "[1,   535] train_loss: 1.873 train_accuracy: 0.342 test_accuracy: 0.335\n",
            "[1,   540] train_loss: 1.865 train_accuracy: 0.343 test_accuracy: 0.335\n",
            "[1,   545] train_loss: 1.964 train_accuracy: 0.322 test_accuracy: 0.311\n",
            "[1,   550] train_loss: 1.729 train_accuracy: 0.346 test_accuracy: 0.338\n",
            "[1,   555] train_loss: 1.757 train_accuracy: 0.334 test_accuracy: 0.317\n",
            "[1,   560] train_loss: 1.906 train_accuracy: 0.340 test_accuracy: 0.338\n",
            "[1,   565] train_loss: 1.965 train_accuracy: 0.321 test_accuracy: 0.315\n",
            "[1,   570] train_loss: 1.900 train_accuracy: 0.330 test_accuracy: 0.319\n",
            "[1,   575] train_loss: 1.799 train_accuracy: 0.325 test_accuracy: 0.313\n",
            "[1,   580] train_loss: 1.908 train_accuracy: 0.350 test_accuracy: 0.337\n",
            "[1,   585] train_loss: 1.878 train_accuracy: 0.343 test_accuracy: 0.327\n",
            "[1,   590] train_loss: 1.816 train_accuracy: 0.331 test_accuracy: 0.317\n",
            "[1,   595] train_loss: 1.776 train_accuracy: 0.354 test_accuracy: 0.350\n",
            "[1,   600] train_loss: 1.908 train_accuracy: 0.349 test_accuracy: 0.344\n",
            "[1,   605] train_loss: 1.755 train_accuracy: 0.354 test_accuracy: 0.352\n",
            "[1,   610] train_loss: 1.809 train_accuracy: 0.351 test_accuracy: 0.346\n",
            "[1,   615] train_loss: 1.847 train_accuracy: 0.354 test_accuracy: 0.349\n",
            "[1,   620] train_loss: 1.774 train_accuracy: 0.361 test_accuracy: 0.350\n",
            "[1,   625] train_loss: 1.865 train_accuracy: 0.349 test_accuracy: 0.346\n",
            "[1,   630] train_loss: 1.993 train_accuracy: 0.340 test_accuracy: 0.340\n",
            "[1,   635] train_loss: 1.803 train_accuracy: 0.311 test_accuracy: 0.311\n",
            "[1,   640] train_loss: 1.907 train_accuracy: 0.345 test_accuracy: 0.340\n",
            "[1,   645] train_loss: 1.836 train_accuracy: 0.349 test_accuracy: 0.340\n",
            "[1,   650] train_loss: 1.825 train_accuracy: 0.352 test_accuracy: 0.345\n",
            "[1,   655] train_loss: 1.857 train_accuracy: 0.348 test_accuracy: 0.351\n",
            "[1,   660] train_loss: 1.856 train_accuracy: 0.329 test_accuracy: 0.322\n",
            "[1,   665] train_loss: 1.795 train_accuracy: 0.345 test_accuracy: 0.330\n",
            "[1,   670] train_loss: 1.929 train_accuracy: 0.362 test_accuracy: 0.351\n",
            "[1,   675] train_loss: 1.800 train_accuracy: 0.356 test_accuracy: 0.348\n",
            "[1,   680] train_loss: 1.865 train_accuracy: 0.352 test_accuracy: 0.344\n",
            "[1,   685] train_loss: 1.817 train_accuracy: 0.343 test_accuracy: 0.336\n",
            "[1,   690] train_loss: 1.947 train_accuracy: 0.352 test_accuracy: 0.352\n",
            "[1,   695] train_loss: 1.788 train_accuracy: 0.350 test_accuracy: 0.355\n",
            "[1,   700] train_loss: 1.905 train_accuracy: 0.355 test_accuracy: 0.358\n",
            "[1,   705] train_loss: 1.776 train_accuracy: 0.350 test_accuracy: 0.343\n",
            "[1,   710] train_loss: 1.930 train_accuracy: 0.339 test_accuracy: 0.329\n",
            "[1,   715] train_loss: 1.882 train_accuracy: 0.340 test_accuracy: 0.336\n",
            "[1,   720] train_loss: 1.770 train_accuracy: 0.353 test_accuracy: 0.337\n",
            "[1,   725] train_loss: 1.916 train_accuracy: 0.350 test_accuracy: 0.338\n",
            "[1,   730] train_loss: 1.921 train_accuracy: 0.361 test_accuracy: 0.349\n",
            "[1,   735] train_loss: 1.914 train_accuracy: 0.368 test_accuracy: 0.365\n",
            "[1,   740] train_loss: 1.819 train_accuracy: 0.356 test_accuracy: 0.355\n",
            "[1,   745] train_loss: 1.778 train_accuracy: 0.360 test_accuracy: 0.353\n",
            "[1,   750] train_loss: 1.855 train_accuracy: 0.346 test_accuracy: 0.336\n",
            "[1,   755] train_loss: 1.892 train_accuracy: 0.346 test_accuracy: 0.335\n",
            "[1,   760] train_loss: 1.910 train_accuracy: 0.356 test_accuracy: 0.344\n",
            "[1,   765] train_loss: 1.767 train_accuracy: 0.363 test_accuracy: 0.351\n",
            "[1,   770] train_loss: 1.921 train_accuracy: 0.374 test_accuracy: 0.370\n",
            "[1,   775] train_loss: 1.822 train_accuracy: 0.361 test_accuracy: 0.361\n",
            "[1,   780] train_loss: 1.968 train_accuracy: 0.346 test_accuracy: 0.350\n",
            "[1,   785] train_loss: 1.773 train_accuracy: 0.366 test_accuracy: 0.367\n",
            "[1,   790] train_loss: 1.732 train_accuracy: 0.365 test_accuracy: 0.360\n",
            "[1,   795] train_loss: 1.870 train_accuracy: 0.362 test_accuracy: 0.358\n",
            "[1,   800] train_loss: 1.910 train_accuracy: 0.343 test_accuracy: 0.335\n",
            "[1,   805] train_loss: 1.758 train_accuracy: 0.334 test_accuracy: 0.322\n",
            "[1,   810] train_loss: 1.805 train_accuracy: 0.362 test_accuracy: 0.357\n",
            "[1,   815] train_loss: 1.926 train_accuracy: 0.363 test_accuracy: 0.352\n",
            "[1,   820] train_loss: 1.755 train_accuracy: 0.375 test_accuracy: 0.364\n",
            "[1,   825] train_loss: 1.693 train_accuracy: 0.370 test_accuracy: 0.359\n",
            "[1,   830] train_loss: 1.770 train_accuracy: 0.365 test_accuracy: 0.363\n",
            "[1,   835] train_loss: 1.987 train_accuracy: 0.349 test_accuracy: 0.345\n",
            "[1,   840] train_loss: 1.783 train_accuracy: 0.345 test_accuracy: 0.343\n",
            "[1,   845] train_loss: 1.927 train_accuracy: 0.352 test_accuracy: 0.347\n",
            "[1,   850] train_loss: 1.820 train_accuracy: 0.363 test_accuracy: 0.354\n",
            "[1,   855] train_loss: 1.745 train_accuracy: 0.356 test_accuracy: 0.346\n",
            "[1,   860] train_loss: 1.792 train_accuracy: 0.358 test_accuracy: 0.353\n",
            "[1,   865] train_loss: 1.819 train_accuracy: 0.350 test_accuracy: 0.352\n",
            "[1,   870] train_loss: 1.842 train_accuracy: 0.370 test_accuracy: 0.362\n",
            "[1,   875] train_loss: 1.846 train_accuracy: 0.365 test_accuracy: 0.361\n",
            "[1,   880] train_loss: 1.912 train_accuracy: 0.368 test_accuracy: 0.358\n",
            "[1,   885] train_loss: 1.783 train_accuracy: 0.360 test_accuracy: 0.352\n",
            "[1,   890] train_loss: 1.826 train_accuracy: 0.363 test_accuracy: 0.353\n",
            "[1,   895] train_loss: 1.805 train_accuracy: 0.352 test_accuracy: 0.345\n",
            "[1,   900] train_loss: 1.804 train_accuracy: 0.359 test_accuracy: 0.350\n",
            "[1,   905] train_loss: 1.846 train_accuracy: 0.359 test_accuracy: 0.351\n",
            "[1,   910] train_loss: 1.823 train_accuracy: 0.358 test_accuracy: 0.346\n",
            "[1,   915] train_loss: 1.871 train_accuracy: 0.353 test_accuracy: 0.341\n",
            "[1,   920] train_loss: 1.899 train_accuracy: 0.369 test_accuracy: 0.360\n",
            "[1,   925] train_loss: 1.871 train_accuracy: 0.350 test_accuracy: 0.342\n",
            "[1,   930] train_loss: 1.847 train_accuracy: 0.364 test_accuracy: 0.357\n",
            "[1,   935] train_loss: 1.953 train_accuracy: 0.356 test_accuracy: 0.352\n",
            "[1,   940] train_loss: 1.787 train_accuracy: 0.349 test_accuracy: 0.345\n",
            "[1,   945] train_loss: 1.812 train_accuracy: 0.352 test_accuracy: 0.345\n",
            "[1,   950] train_loss: 1.861 train_accuracy: 0.359 test_accuracy: 0.342\n",
            "[1,   955] train_loss: 1.819 train_accuracy: 0.371 test_accuracy: 0.358\n",
            "[1,   960] train_loss: 1.890 train_accuracy: 0.377 test_accuracy: 0.368\n",
            "[1,   965] train_loss: 1.843 train_accuracy: 0.357 test_accuracy: 0.349\n",
            "[1,   970] train_loss: 1.836 train_accuracy: 0.357 test_accuracy: 0.349\n",
            "[1,   975] train_loss: 1.794 train_accuracy: 0.366 test_accuracy: 0.363\n",
            "[1,   980] train_loss: 1.833 train_accuracy: 0.352 test_accuracy: 0.347\n",
            "[1,   985] train_loss: 1.786 train_accuracy: 0.343 test_accuracy: 0.342\n",
            "[1,   990] train_loss: 1.870 train_accuracy: 0.355 test_accuracy: 0.356\n",
            "[1,   995] train_loss: 1.803 train_accuracy: 0.371 test_accuracy: 0.360\n",
            "[1,  1000] train_loss: 1.818 train_accuracy: 0.381 test_accuracy: 0.363\n",
            "[1,  1005] train_loss: 1.928 train_accuracy: 0.380 test_accuracy: 0.363\n",
            "[1,  1010] train_loss: 1.921 train_accuracy: 0.365 test_accuracy: 0.353\n",
            "[1,  1015] train_loss: 1.894 train_accuracy: 0.359 test_accuracy: 0.341\n",
            "[1,  1020] train_loss: 1.768 train_accuracy: 0.354 test_accuracy: 0.341\n",
            "[1,  1025] train_loss: 1.834 train_accuracy: 0.351 test_accuracy: 0.339\n",
            "[1,  1030] train_loss: 1.816 train_accuracy: 0.367 test_accuracy: 0.361\n",
            "[1,  1035] train_loss: 1.796 train_accuracy: 0.351 test_accuracy: 0.349\n",
            "[1,  1040] train_loss: 1.836 train_accuracy: 0.356 test_accuracy: 0.346\n",
            "[1,  1045] train_loss: 1.870 train_accuracy: 0.362 test_accuracy: 0.361\n",
            "[1,  1050] train_loss: 1.821 train_accuracy: 0.363 test_accuracy: 0.355\n",
            "[1,  1055] train_loss: 1.923 train_accuracy: 0.367 test_accuracy: 0.355\n",
            "[1,  1060] train_loss: 1.746 train_accuracy: 0.359 test_accuracy: 0.357\n",
            "[1,  1065] train_loss: 1.830 train_accuracy: 0.352 test_accuracy: 0.343\n",
            "[1,  1070] train_loss: 1.750 train_accuracy: 0.356 test_accuracy: 0.350\n",
            "[1,  1075] train_loss: 1.876 train_accuracy: 0.352 test_accuracy: 0.350\n",
            "[1,  1080] train_loss: 1.805 train_accuracy: 0.361 test_accuracy: 0.359\n",
            "[1,  1085] train_loss: 1.833 train_accuracy: 0.380 test_accuracy: 0.366\n",
            "[1,  1090] train_loss: 1.900 train_accuracy: 0.372 test_accuracy: 0.358\n",
            "[1,  1095] train_loss: 1.863 train_accuracy: 0.369 test_accuracy: 0.358\n",
            "[1,  1100] train_loss: 1.858 train_accuracy: 0.366 test_accuracy: 0.359\n",
            "[1,  1105] train_loss: 1.850 train_accuracy: 0.361 test_accuracy: 0.356\n",
            "[1,  1110] train_loss: 1.826 train_accuracy: 0.357 test_accuracy: 0.347\n",
            "[1,  1115] train_loss: 1.756 train_accuracy: 0.372 test_accuracy: 0.360\n",
            "[1,  1120] train_loss: 1.842 train_accuracy: 0.387 test_accuracy: 0.369\n",
            "[1,  1125] train_loss: 1.829 train_accuracy: 0.378 test_accuracy: 0.363\n",
            "[1,  1130] train_loss: 1.841 train_accuracy: 0.351 test_accuracy: 0.347\n",
            "[1,  1135] train_loss: 1.943 train_accuracy: 0.350 test_accuracy: 0.341\n",
            "[1,  1140] train_loss: 1.802 train_accuracy: 0.369 test_accuracy: 0.358\n",
            "[1,  1145] train_loss: 1.812 train_accuracy: 0.367 test_accuracy: 0.362\n",
            "[1,  1150] train_loss: 1.819 train_accuracy: 0.367 test_accuracy: 0.358\n",
            "[1,  1155] train_loss: 1.813 train_accuracy: 0.360 test_accuracy: 0.349\n",
            "[1,  1160] train_loss: 1.752 train_accuracy: 0.348 test_accuracy: 0.335\n",
            "[1,  1165] train_loss: 1.860 train_accuracy: 0.360 test_accuracy: 0.352\n",
            "[1,  1170] train_loss: 1.868 train_accuracy: 0.348 test_accuracy: 0.343\n",
            "[1,  1175] train_loss: 1.990 train_accuracy: 0.366 test_accuracy: 0.354\n",
            "[1,  1180] train_loss: 1.813 train_accuracy: 0.364 test_accuracy: 0.353\n",
            "[1,  1185] train_loss: 1.911 train_accuracy: 0.371 test_accuracy: 0.356\n",
            "[1,  1190] train_loss: 1.769 train_accuracy: 0.371 test_accuracy: 0.357\n",
            "[1,  1195] train_loss: 1.842 train_accuracy: 0.374 test_accuracy: 0.360\n",
            "[1,  1200] train_loss: 1.844 train_accuracy: 0.370 test_accuracy: 0.362\n",
            "[1,  1205] train_loss: 1.750 train_accuracy: 0.367 test_accuracy: 0.355\n",
            "[1,  1210] train_loss: 1.777 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[1,  1215] train_loss: 1.723 train_accuracy: 0.372 test_accuracy: 0.361\n",
            "[1,  1220] train_loss: 1.976 train_accuracy: 0.362 test_accuracy: 0.356\n",
            "[1,  1225] train_loss: 1.830 train_accuracy: 0.341 test_accuracy: 0.334\n",
            "[1,  1230] train_loss: 1.748 train_accuracy: 0.359 test_accuracy: 0.344\n",
            "[1,  1235] train_loss: 1.720 train_accuracy: 0.382 test_accuracy: 0.370\n",
            "[1,  1240] train_loss: 1.927 train_accuracy: 0.367 test_accuracy: 0.359\n",
            "[1,  1245] train_loss: 1.732 train_accuracy: 0.355 test_accuracy: 0.343\n",
            "[2,     5] train_loss: 1.952 train_accuracy: 0.347 test_accuracy: 0.336\n",
            "[2,    10] train_loss: 1.825 train_accuracy: 0.369 test_accuracy: 0.366\n",
            "[2,    15] train_loss: 1.894 train_accuracy: 0.360 test_accuracy: 0.351\n",
            "[2,    20] train_loss: 1.811 train_accuracy: 0.363 test_accuracy: 0.356\n",
            "[2,    25] train_loss: 1.918 train_accuracy: 0.368 test_accuracy: 0.363\n",
            "[2,    30] train_loss: 1.770 train_accuracy: 0.368 test_accuracy: 0.362\n",
            "[2,    35] train_loss: 1.702 train_accuracy: 0.355 test_accuracy: 0.354\n",
            "[2,    40] train_loss: 1.827 train_accuracy: 0.365 test_accuracy: 0.361\n",
            "[2,    45] train_loss: 1.853 train_accuracy: 0.380 test_accuracy: 0.368\n",
            "[2,    50] train_loss: 1.806 train_accuracy: 0.376 test_accuracy: 0.358\n",
            "[2,    55] train_loss: 1.724 train_accuracy: 0.373 test_accuracy: 0.359\n",
            "[2,    60] train_loss: 1.839 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[2,    65] train_loss: 1.777 train_accuracy: 0.371 test_accuracy: 0.357\n",
            "[2,    70] train_loss: 1.764 train_accuracy: 0.374 test_accuracy: 0.357\n",
            "[2,    75] train_loss: 1.822 train_accuracy: 0.364 test_accuracy: 0.352\n",
            "[2,    80] train_loss: 1.806 train_accuracy: 0.365 test_accuracy: 0.353\n",
            "[2,    85] train_loss: 1.924 train_accuracy: 0.371 test_accuracy: 0.357\n",
            "[2,    90] train_loss: 1.893 train_accuracy: 0.360 test_accuracy: 0.344\n",
            "[2,    95] train_loss: 1.764 train_accuracy: 0.370 test_accuracy: 0.356\n",
            "[2,   100] train_loss: 1.817 train_accuracy: 0.362 test_accuracy: 0.350\n",
            "[2,   105] train_loss: 1.858 train_accuracy: 0.368 test_accuracy: 0.352\n",
            "[2,   110] train_loss: 1.698 train_accuracy: 0.367 test_accuracy: 0.351\n",
            "[2,   115] train_loss: 1.816 train_accuracy: 0.349 test_accuracy: 0.336\n",
            "[2,   120] train_loss: 1.808 train_accuracy: 0.358 test_accuracy: 0.343\n",
            "[2,   125] train_loss: 1.875 train_accuracy: 0.373 test_accuracy: 0.354\n",
            "[2,   130] train_loss: 1.785 train_accuracy: 0.359 test_accuracy: 0.347\n",
            "[2,   135] train_loss: 1.901 train_accuracy: 0.366 test_accuracy: 0.355\n",
            "[2,   140] train_loss: 1.896 train_accuracy: 0.372 test_accuracy: 0.358\n",
            "[2,   145] train_loss: 1.866 train_accuracy: 0.355 test_accuracy: 0.342\n",
            "[2,   150] train_loss: 1.841 train_accuracy: 0.371 test_accuracy: 0.355\n",
            "[2,   155] train_loss: 1.836 train_accuracy: 0.358 test_accuracy: 0.349\n",
            "[2,   160] train_loss: 1.760 train_accuracy: 0.382 test_accuracy: 0.369\n",
            "[2,   165] train_loss: 1.791 train_accuracy: 0.363 test_accuracy: 0.352\n",
            "[2,   170] train_loss: 1.778 train_accuracy: 0.359 test_accuracy: 0.355\n",
            "[2,   175] train_loss: 1.849 train_accuracy: 0.357 test_accuracy: 0.354\n",
            "[2,   180] train_loss: 1.846 train_accuracy: 0.351 test_accuracy: 0.351\n",
            "[2,   185] train_loss: 2.018 train_accuracy: 0.353 test_accuracy: 0.346\n",
            "[2,   190] train_loss: 1.828 train_accuracy: 0.374 test_accuracy: 0.361\n",
            "[2,   195] train_loss: 1.812 train_accuracy: 0.374 test_accuracy: 0.363\n",
            "[2,   200] train_loss: 1.795 train_accuracy: 0.375 test_accuracy: 0.361\n",
            "[2,   205] train_loss: 1.721 train_accuracy: 0.374 test_accuracy: 0.363\n",
            "[2,   210] train_loss: 1.896 train_accuracy: 0.365 test_accuracy: 0.357\n",
            "[2,   215] train_loss: 1.752 train_accuracy: 0.371 test_accuracy: 0.358\n",
            "[2,   220] train_loss: 1.789 train_accuracy: 0.363 test_accuracy: 0.356\n",
            "[2,   225] train_loss: 1.840 train_accuracy: 0.352 test_accuracy: 0.342\n",
            "[2,   230] train_loss: 1.800 train_accuracy: 0.355 test_accuracy: 0.346\n",
            "[2,   235] train_loss: 1.878 train_accuracy: 0.370 test_accuracy: 0.361\n",
            "[2,   240] train_loss: 1.739 train_accuracy: 0.371 test_accuracy: 0.356\n",
            "[2,   245] train_loss: 1.800 train_accuracy: 0.376 test_accuracy: 0.365\n",
            "[2,   250] train_loss: 1.886 train_accuracy: 0.362 test_accuracy: 0.350\n",
            "[2,   255] train_loss: 1.732 train_accuracy: 0.370 test_accuracy: 0.356\n",
            "[2,   260] train_loss: 2.005 train_accuracy: 0.372 test_accuracy: 0.362\n",
            "[2,   265] train_loss: 1.847 train_accuracy: 0.343 test_accuracy: 0.342\n",
            "[2,   270] train_loss: 1.980 train_accuracy: 0.346 test_accuracy: 0.343\n",
            "[2,   275] train_loss: 1.781 train_accuracy: 0.366 test_accuracy: 0.356\n",
            "[2,   280] train_loss: 1.804 train_accuracy: 0.366 test_accuracy: 0.350\n",
            "[2,   285] train_loss: 1.806 train_accuracy: 0.351 test_accuracy: 0.341\n",
            "[2,   290] train_loss: 1.912 train_accuracy: 0.345 test_accuracy: 0.335\n",
            "[2,   295] train_loss: 1.821 train_accuracy: 0.341 test_accuracy: 0.342\n",
            "[2,   300] train_loss: 1.847 train_accuracy: 0.359 test_accuracy: 0.358\n",
            "[2,   305] train_loss: 1.850 train_accuracy: 0.360 test_accuracy: 0.349\n",
            "[2,   310] train_loss: 1.822 train_accuracy: 0.369 test_accuracy: 0.351\n",
            "[2,   315] train_loss: 1.661 train_accuracy: 0.381 test_accuracy: 0.370\n",
            "[2,   320] train_loss: 1.817 train_accuracy: 0.370 test_accuracy: 0.357\n",
            "[2,   325] train_loss: 1.971 train_accuracy: 0.377 test_accuracy: 0.365\n",
            "[2,   330] train_loss: 1.705 train_accuracy: 0.365 test_accuracy: 0.357\n",
            "[2,   335] train_loss: 1.749 train_accuracy: 0.370 test_accuracy: 0.361\n",
            "[2,   340] train_loss: 1.801 train_accuracy: 0.372 test_accuracy: 0.363\n",
            "[2,   345] train_loss: 1.859 train_accuracy: 0.374 test_accuracy: 0.368\n",
            "[2,   350] train_loss: 1.769 train_accuracy: 0.374 test_accuracy: 0.367\n",
            "[2,   355] train_loss: 1.811 train_accuracy: 0.383 test_accuracy: 0.376\n",
            "[2,   360] train_loss: 1.971 train_accuracy: 0.379 test_accuracy: 0.367\n",
            "[2,   365] train_loss: 1.858 train_accuracy: 0.378 test_accuracy: 0.367\n",
            "[2,   370] train_loss: 1.766 train_accuracy: 0.373 test_accuracy: 0.364\n",
            "[2,   375] train_loss: 1.572 train_accuracy: 0.361 test_accuracy: 0.355\n",
            "[2,   380] train_loss: 1.760 train_accuracy: 0.375 test_accuracy: 0.367\n",
            "[2,   385] train_loss: 1.902 train_accuracy: 0.371 test_accuracy: 0.359\n",
            "[2,   390] train_loss: 1.811 train_accuracy: 0.377 test_accuracy: 0.370\n",
            "[2,   395] train_loss: 1.671 train_accuracy: 0.371 test_accuracy: 0.361\n",
            "[2,   400] train_loss: 1.803 train_accuracy: 0.370 test_accuracy: 0.364\n",
            "[2,   405] train_loss: 1.788 train_accuracy: 0.370 test_accuracy: 0.363\n",
            "[2,   410] train_loss: 1.866 train_accuracy: 0.366 test_accuracy: 0.354\n",
            "[2,   415] train_loss: 1.882 train_accuracy: 0.363 test_accuracy: 0.357\n",
            "[2,   420] train_loss: 1.780 train_accuracy: 0.356 test_accuracy: 0.355\n",
            "[2,   425] train_loss: 1.930 train_accuracy: 0.375 test_accuracy: 0.370\n",
            "[2,   430] train_loss: 1.787 train_accuracy: 0.383 test_accuracy: 0.372\n",
            "[2,   435] train_loss: 1.796 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[2,   440] train_loss: 1.832 train_accuracy: 0.376 test_accuracy: 0.364\n",
            "[2,   445] train_loss: 1.875 train_accuracy: 0.381 test_accuracy: 0.372\n",
            "[2,   450] train_loss: 1.797 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[2,   455] train_loss: 1.788 train_accuracy: 0.371 test_accuracy: 0.365\n",
            "[2,   460] train_loss: 1.753 train_accuracy: 0.367 test_accuracy: 0.363\n",
            "[2,   465] train_loss: 1.772 train_accuracy: 0.367 test_accuracy: 0.354\n",
            "[2,   470] train_loss: 1.788 train_accuracy: 0.384 test_accuracy: 0.367\n",
            "[2,   475] train_loss: 1.671 train_accuracy: 0.375 test_accuracy: 0.366\n",
            "[2,   480] train_loss: 1.812 train_accuracy: 0.385 test_accuracy: 0.375\n",
            "[2,   485] train_loss: 1.846 train_accuracy: 0.378 test_accuracy: 0.365\n",
            "[2,   490] train_loss: 1.785 train_accuracy: 0.364 test_accuracy: 0.349\n",
            "[2,   495] train_loss: 1.842 train_accuracy: 0.368 test_accuracy: 0.349\n",
            "[2,   500] train_loss: 1.781 train_accuracy: 0.365 test_accuracy: 0.352\n",
            "[2,   505] train_loss: 1.793 train_accuracy: 0.377 test_accuracy: 0.364\n",
            "[2,   510] train_loss: 1.774 train_accuracy: 0.378 test_accuracy: 0.363\n",
            "[2,   515] train_loss: 1.765 train_accuracy: 0.353 test_accuracy: 0.339\n",
            "[2,   520] train_loss: 1.667 train_accuracy: 0.366 test_accuracy: 0.360\n",
            "[2,   525] train_loss: 1.820 train_accuracy: 0.371 test_accuracy: 0.356\n",
            "[2,   530] train_loss: 1.849 train_accuracy: 0.370 test_accuracy: 0.355\n",
            "[2,   535] train_loss: 1.784 train_accuracy: 0.376 test_accuracy: 0.357\n",
            "[2,   540] train_loss: 1.829 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[2,   545] train_loss: 1.794 train_accuracy: 0.369 test_accuracy: 0.358\n",
            "[2,   550] train_loss: 1.801 train_accuracy: 0.364 test_accuracy: 0.355\n",
            "[2,   555] train_loss: 1.797 train_accuracy: 0.388 test_accuracy: 0.371\n",
            "[2,   560] train_loss: 1.802 train_accuracy: 0.374 test_accuracy: 0.363\n",
            "[2,   565] train_loss: 1.775 train_accuracy: 0.375 test_accuracy: 0.363\n",
            "[2,   570] train_loss: 1.723 train_accuracy: 0.384 test_accuracy: 0.373\n",
            "[2,   575] train_loss: 1.771 train_accuracy: 0.367 test_accuracy: 0.366\n",
            "[2,   580] train_loss: 1.796 train_accuracy: 0.372 test_accuracy: 0.367\n",
            "[2,   585] train_loss: 1.787 train_accuracy: 0.382 test_accuracy: 0.374\n",
            "[2,   590] train_loss: 1.807 train_accuracy: 0.386 test_accuracy: 0.365\n",
            "[2,   595] train_loss: 1.696 train_accuracy: 0.374 test_accuracy: 0.356\n",
            "[2,   600] train_loss: 1.864 train_accuracy: 0.377 test_accuracy: 0.358\n",
            "[2,   605] train_loss: 1.777 train_accuracy: 0.376 test_accuracy: 0.364\n",
            "[2,   610] train_loss: 1.602 train_accuracy: 0.364 test_accuracy: 0.354\n",
            "[2,   615] train_loss: 1.694 train_accuracy: 0.366 test_accuracy: 0.357\n",
            "[2,   620] train_loss: 1.862 train_accuracy: 0.373 test_accuracy: 0.361\n",
            "[2,   625] train_loss: 1.648 train_accuracy: 0.366 test_accuracy: 0.356\n",
            "[2,   630] train_loss: 1.852 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[2,   635] train_loss: 1.761 train_accuracy: 0.374 test_accuracy: 0.362\n",
            "[2,   640] train_loss: 1.745 train_accuracy: 0.366 test_accuracy: 0.356\n",
            "[2,   645] train_loss: 1.805 train_accuracy: 0.376 test_accuracy: 0.361\n",
            "[2,   650] train_loss: 1.708 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[2,   655] train_loss: 1.812 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,   660] train_loss: 1.952 train_accuracy: 0.379 test_accuracy: 0.357\n",
            "[2,   665] train_loss: 1.755 train_accuracy: 0.373 test_accuracy: 0.353\n",
            "[2,   670] train_loss: 1.775 train_accuracy: 0.359 test_accuracy: 0.350\n",
            "[2,   675] train_loss: 1.895 train_accuracy: 0.367 test_accuracy: 0.364\n",
            "[2,   680] train_loss: 1.793 train_accuracy: 0.373 test_accuracy: 0.357\n",
            "[2,   685] train_loss: 1.881 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,   690] train_loss: 1.805 train_accuracy: 0.364 test_accuracy: 0.356\n",
            "[2,   695] train_loss: 1.842 train_accuracy: 0.372 test_accuracy: 0.364\n",
            "[2,   700] train_loss: 1.795 train_accuracy: 0.369 test_accuracy: 0.361\n",
            "[2,   705] train_loss: 1.920 train_accuracy: 0.363 test_accuracy: 0.355\n",
            "[2,   710] train_loss: 1.833 train_accuracy: 0.364 test_accuracy: 0.348\n",
            "[2,   715] train_loss: 1.824 train_accuracy: 0.384 test_accuracy: 0.365\n",
            "[2,   720] train_loss: 1.772 train_accuracy: 0.373 test_accuracy: 0.353\n",
            "[2,   725] train_loss: 1.761 train_accuracy: 0.369 test_accuracy: 0.354\n",
            "[2,   730] train_loss: 1.769 train_accuracy: 0.370 test_accuracy: 0.357\n",
            "[2,   735] train_loss: 1.784 train_accuracy: 0.363 test_accuracy: 0.350\n",
            "[2,   740] train_loss: 1.810 train_accuracy: 0.367 test_accuracy: 0.353\n",
            "[2,   745] train_loss: 1.876 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,   750] train_loss: 1.795 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[2,   755] train_loss: 1.782 train_accuracy: 0.382 test_accuracy: 0.360\n",
            "[2,   760] train_loss: 1.659 train_accuracy: 0.376 test_accuracy: 0.364\n",
            "[2,   765] train_loss: 1.812 train_accuracy: 0.360 test_accuracy: 0.357\n",
            "[2,   770] train_loss: 1.692 train_accuracy: 0.373 test_accuracy: 0.355\n",
            "[2,   775] train_loss: 1.718 train_accuracy: 0.364 test_accuracy: 0.351\n",
            "[2,   780] train_loss: 1.894 train_accuracy: 0.383 test_accuracy: 0.364\n",
            "[2,   785] train_loss: 1.981 train_accuracy: 0.380 test_accuracy: 0.362\n",
            "[2,   790] train_loss: 1.795 train_accuracy: 0.368 test_accuracy: 0.359\n",
            "[2,   795] train_loss: 1.849 train_accuracy: 0.364 test_accuracy: 0.353\n",
            "[2,   800] train_loss: 1.780 train_accuracy: 0.375 test_accuracy: 0.363\n",
            "[2,   805] train_loss: 1.751 train_accuracy: 0.385 test_accuracy: 0.375\n",
            "[2,   810] train_loss: 1.722 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[2,   815] train_loss: 1.809 train_accuracy: 0.382 test_accuracy: 0.363\n",
            "[2,   820] train_loss: 1.729 train_accuracy: 0.376 test_accuracy: 0.361\n",
            "[2,   825] train_loss: 1.798 train_accuracy: 0.369 test_accuracy: 0.353\n",
            "[2,   830] train_loss: 1.877 train_accuracy: 0.381 test_accuracy: 0.363\n",
            "[2,   835] train_loss: 1.948 train_accuracy: 0.387 test_accuracy: 0.374\n",
            "[2,   840] train_loss: 1.825 train_accuracy: 0.375 test_accuracy: 0.362\n",
            "[2,   845] train_loss: 1.783 train_accuracy: 0.384 test_accuracy: 0.377\n",
            "[2,   850] train_loss: 1.738 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[2,   855] train_loss: 1.658 train_accuracy: 0.386 test_accuracy: 0.366\n",
            "[2,   860] train_loss: 1.857 train_accuracy: 0.384 test_accuracy: 0.369\n",
            "[2,   865] train_loss: 1.733 train_accuracy: 0.381 test_accuracy: 0.362\n",
            "[2,   870] train_loss: 1.656 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[2,   875] train_loss: 1.676 train_accuracy: 0.379 test_accuracy: 0.361\n",
            "[2,   880] train_loss: 1.958 train_accuracy: 0.370 test_accuracy: 0.351\n",
            "[2,   885] train_loss: 1.845 train_accuracy: 0.375 test_accuracy: 0.355\n",
            "[2,   890] train_loss: 1.791 train_accuracy: 0.389 test_accuracy: 0.368\n",
            "[2,   895] train_loss: 1.667 train_accuracy: 0.393 test_accuracy: 0.362\n",
            "[2,   900] train_loss: 1.804 train_accuracy: 0.382 test_accuracy: 0.367\n",
            "[2,   905] train_loss: 1.809 train_accuracy: 0.372 test_accuracy: 0.354\n",
            "[2,   910] train_loss: 1.745 train_accuracy: 0.383 test_accuracy: 0.368\n",
            "[2,   915] train_loss: 1.755 train_accuracy: 0.384 test_accuracy: 0.370\n",
            "[2,   920] train_loss: 1.794 train_accuracy: 0.368 test_accuracy: 0.349\n",
            "[2,   925] train_loss: 1.828 train_accuracy: 0.362 test_accuracy: 0.354\n",
            "[2,   930] train_loss: 1.843 train_accuracy: 0.383 test_accuracy: 0.367\n",
            "[2,   935] train_loss: 1.714 train_accuracy: 0.368 test_accuracy: 0.356\n",
            "[2,   940] train_loss: 1.670 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[2,   945] train_loss: 1.651 train_accuracy: 0.379 test_accuracy: 0.355\n",
            "[2,   950] train_loss: 1.641 train_accuracy: 0.385 test_accuracy: 0.369\n",
            "[2,   955] train_loss: 1.869 train_accuracy: 0.372 test_accuracy: 0.355\n",
            "[2,   960] train_loss: 1.891 train_accuracy: 0.372 test_accuracy: 0.357\n",
            "[2,   965] train_loss: 1.846 train_accuracy: 0.369 test_accuracy: 0.354\n",
            "[2,   970] train_loss: 1.832 train_accuracy: 0.377 test_accuracy: 0.361\n",
            "[2,   975] train_loss: 1.730 train_accuracy: 0.387 test_accuracy: 0.373\n",
            "[2,   980] train_loss: 1.759 train_accuracy: 0.384 test_accuracy: 0.371\n",
            "[2,   985] train_loss: 1.809 train_accuracy: 0.379 test_accuracy: 0.366\n",
            "[2,   990] train_loss: 1.828 train_accuracy: 0.387 test_accuracy: 0.376\n",
            "[2,   995] train_loss: 1.937 train_accuracy: 0.385 test_accuracy: 0.379\n",
            "[2,  1000] train_loss: 1.881 train_accuracy: 0.365 test_accuracy: 0.353\n",
            "[2,  1005] train_loss: 1.734 train_accuracy: 0.381 test_accuracy: 0.365\n",
            "[2,  1010] train_loss: 1.807 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[2,  1015] train_loss: 1.772 train_accuracy: 0.376 test_accuracy: 0.370\n",
            "[2,  1020] train_loss: 1.798 train_accuracy: 0.378 test_accuracy: 0.369\n",
            "[2,  1025] train_loss: 1.711 train_accuracy: 0.398 test_accuracy: 0.380\n",
            "[2,  1030] train_loss: 1.841 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[2,  1035] train_loss: 1.605 train_accuracy: 0.384 test_accuracy: 0.371\n",
            "[2,  1040] train_loss: 1.916 train_accuracy: 0.384 test_accuracy: 0.373\n",
            "[2,  1045] train_loss: 1.734 train_accuracy: 0.379 test_accuracy: 0.365\n",
            "[2,  1050] train_loss: 1.782 train_accuracy: 0.371 test_accuracy: 0.360\n",
            "[2,  1055] train_loss: 1.765 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[2,  1060] train_loss: 1.781 train_accuracy: 0.382 test_accuracy: 0.371\n",
            "[2,  1065] train_loss: 1.579 train_accuracy: 0.384 test_accuracy: 0.374\n",
            "[2,  1070] train_loss: 1.803 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[2,  1075] train_loss: 1.881 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[2,  1080] train_loss: 1.840 train_accuracy: 0.372 test_accuracy: 0.355\n",
            "[2,  1085] train_loss: 1.870 train_accuracy: 0.378 test_accuracy: 0.365\n",
            "[2,  1090] train_loss: 1.775 train_accuracy: 0.377 test_accuracy: 0.366\n",
            "[2,  1095] train_loss: 1.725 train_accuracy: 0.377 test_accuracy: 0.364\n",
            "[2,  1100] train_loss: 1.689 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[2,  1105] train_loss: 1.790 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[2,  1110] train_loss: 1.805 train_accuracy: 0.398 test_accuracy: 0.386\n",
            "[2,  1115] train_loss: 1.907 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[2,  1120] train_loss: 1.738 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[2,  1125] train_loss: 1.773 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[2,  1130] train_loss: 1.817 train_accuracy: 0.361 test_accuracy: 0.349\n",
            "[2,  1135] train_loss: 1.737 train_accuracy: 0.378 test_accuracy: 0.360\n",
            "[2,  1140] train_loss: 1.787 train_accuracy: 0.383 test_accuracy: 0.365\n",
            "[2,  1145] train_loss: 1.671 train_accuracy: 0.380 test_accuracy: 0.359\n",
            "[2,  1150] train_loss: 1.651 train_accuracy: 0.387 test_accuracy: 0.365\n",
            "[2,  1155] train_loss: 1.694 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[2,  1160] train_loss: 1.857 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[2,  1165] train_loss: 1.788 train_accuracy: 0.357 test_accuracy: 0.349\n",
            "[2,  1170] train_loss: 1.683 train_accuracy: 0.369 test_accuracy: 0.356\n",
            "[2,  1175] train_loss: 1.797 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[2,  1180] train_loss: 1.821 train_accuracy: 0.392 test_accuracy: 0.372\n",
            "[2,  1185] train_loss: 1.788 train_accuracy: 0.387 test_accuracy: 0.368\n",
            "[2,  1190] train_loss: 1.790 train_accuracy: 0.374 test_accuracy: 0.359\n",
            "[2,  1195] train_loss: 1.745 train_accuracy: 0.380 test_accuracy: 0.369\n",
            "[2,  1200] train_loss: 1.791 train_accuracy: 0.382 test_accuracy: 0.375\n",
            "[2,  1205] train_loss: 1.913 train_accuracy: 0.370 test_accuracy: 0.357\n",
            "[2,  1210] train_loss: 1.774 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[2,  1215] train_loss: 1.821 train_accuracy: 0.388 test_accuracy: 0.365\n",
            "[2,  1220] train_loss: 1.923 train_accuracy: 0.384 test_accuracy: 0.367\n",
            "[2,  1225] train_loss: 1.798 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[2,  1230] train_loss: 1.791 train_accuracy: 0.389 test_accuracy: 0.376\n",
            "[2,  1235] train_loss: 1.807 train_accuracy: 0.384 test_accuracy: 0.373\n",
            "[2,  1240] train_loss: 1.676 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[2,  1245] train_loss: 1.773 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[3,     5] train_loss: 1.695 train_accuracy: 0.380 test_accuracy: 0.366\n",
            "[3,    10] train_loss: 1.868 train_accuracy: 0.377 test_accuracy: 0.366\n",
            "[3,    15] train_loss: 1.763 train_accuracy: 0.380 test_accuracy: 0.375\n",
            "[3,    20] train_loss: 1.678 train_accuracy: 0.382 test_accuracy: 0.369\n",
            "[3,    25] train_loss: 1.840 train_accuracy: 0.388 test_accuracy: 0.368\n",
            "[3,    30] train_loss: 1.803 train_accuracy: 0.395 test_accuracy: 0.374\n",
            "[3,    35] train_loss: 1.889 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[3,    40] train_loss: 1.681 train_accuracy: 0.393 test_accuracy: 0.380\n",
            "[3,    45] train_loss: 1.715 train_accuracy: 0.390 test_accuracy: 0.376\n",
            "[3,    50] train_loss: 1.842 train_accuracy: 0.385 test_accuracy: 0.375\n",
            "[3,    55] train_loss: 1.794 train_accuracy: 0.388 test_accuracy: 0.374\n",
            "[3,    60] train_loss: 1.700 train_accuracy: 0.380 test_accuracy: 0.363\n",
            "[3,    65] train_loss: 1.665 train_accuracy: 0.386 test_accuracy: 0.368\n",
            "[3,    70] train_loss: 1.693 train_accuracy: 0.384 test_accuracy: 0.369\n",
            "[3,    75] train_loss: 1.777 train_accuracy: 0.390 test_accuracy: 0.378\n",
            "[3,    80] train_loss: 1.757 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[3,    85] train_loss: 1.766 train_accuracy: 0.391 test_accuracy: 0.379\n",
            "[3,    90] train_loss: 1.726 train_accuracy: 0.375 test_accuracy: 0.360\n",
            "[3,    95] train_loss: 1.726 train_accuracy: 0.392 test_accuracy: 0.372\n",
            "[3,   100] train_loss: 1.646 train_accuracy: 0.388 test_accuracy: 0.372\n",
            "[3,   105] train_loss: 1.762 train_accuracy: 0.385 test_accuracy: 0.366\n",
            "[3,   110] train_loss: 1.775 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[3,   115] train_loss: 1.736 train_accuracy: 0.384 test_accuracy: 0.366\n",
            "[3,   120] train_loss: 1.759 train_accuracy: 0.383 test_accuracy: 0.365\n",
            "[3,   125] train_loss: 1.802 train_accuracy: 0.388 test_accuracy: 0.366\n",
            "[3,   130] train_loss: 1.670 train_accuracy: 0.373 test_accuracy: 0.363\n",
            "[3,   135] train_loss: 1.830 train_accuracy: 0.381 test_accuracy: 0.370\n",
            "[3,   140] train_loss: 1.905 train_accuracy: 0.387 test_accuracy: 0.366\n",
            "[3,   145] train_loss: 1.855 train_accuracy: 0.377 test_accuracy: 0.364\n",
            "[3,   150] train_loss: 1.799 train_accuracy: 0.374 test_accuracy: 0.360\n",
            "[3,   155] train_loss: 1.807 train_accuracy: 0.381 test_accuracy: 0.362\n",
            "[3,   160] train_loss: 1.725 train_accuracy: 0.377 test_accuracy: 0.365\n",
            "[3,   165] train_loss: 1.743 train_accuracy: 0.377 test_accuracy: 0.369\n",
            "[3,   170] train_loss: 1.846 train_accuracy: 0.386 test_accuracy: 0.376\n",
            "[3,   175] train_loss: 1.814 train_accuracy: 0.392 test_accuracy: 0.389\n",
            "[3,   180] train_loss: 1.719 train_accuracy: 0.390 test_accuracy: 0.377\n",
            "[3,   185] train_loss: 1.857 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[3,   190] train_loss: 1.628 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[3,   195] train_loss: 1.654 train_accuracy: 0.385 test_accuracy: 0.372\n",
            "[3,   200] train_loss: 1.733 train_accuracy: 0.397 test_accuracy: 0.384\n",
            "[3,   205] train_loss: 1.717 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[3,   210] train_loss: 1.651 train_accuracy: 0.396 test_accuracy: 0.380\n",
            "[3,   215] train_loss: 1.811 train_accuracy: 0.384 test_accuracy: 0.372\n",
            "[3,   220] train_loss: 1.856 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[3,   225] train_loss: 1.854 train_accuracy: 0.379 test_accuracy: 0.357\n",
            "[3,   230] train_loss: 1.840 train_accuracy: 0.393 test_accuracy: 0.368\n",
            "[3,   235] train_loss: 1.810 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[3,   240] train_loss: 1.780 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[3,   245] train_loss: 1.817 train_accuracy: 0.385 test_accuracy: 0.366\n",
            "[3,   250] train_loss: 1.717 train_accuracy: 0.386 test_accuracy: 0.365\n",
            "[3,   255] train_loss: 1.909 train_accuracy: 0.401 test_accuracy: 0.385\n",
            "[3,   260] train_loss: 1.736 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   265] train_loss: 1.829 train_accuracy: 0.402 test_accuracy: 0.382\n",
            "[3,   270] train_loss: 1.765 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[3,   275] train_loss: 1.752 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[3,   280] train_loss: 1.894 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[3,   285] train_loss: 1.595 train_accuracy: 0.373 test_accuracy: 0.349\n",
            "[3,   290] train_loss: 1.895 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[3,   295] train_loss: 1.668 train_accuracy: 0.402 test_accuracy: 0.386\n",
            "[3,   300] train_loss: 1.803 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,   305] train_loss: 1.758 train_accuracy: 0.381 test_accuracy: 0.360\n",
            "[3,   310] train_loss: 1.775 train_accuracy: 0.389 test_accuracy: 0.369\n",
            "[3,   315] train_loss: 1.816 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[3,   320] train_loss: 1.706 train_accuracy: 0.388 test_accuracy: 0.378\n",
            "[3,   325] train_loss: 1.701 train_accuracy: 0.379 test_accuracy: 0.367\n",
            "[3,   330] train_loss: 1.754 train_accuracy: 0.373 test_accuracy: 0.351\n",
            "[3,   335] train_loss: 1.704 train_accuracy: 0.380 test_accuracy: 0.363\n",
            "[3,   340] train_loss: 1.737 train_accuracy: 0.392 test_accuracy: 0.371\n",
            "[3,   345] train_loss: 1.737 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[3,   350] train_loss: 1.647 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[3,   355] train_loss: 1.722 train_accuracy: 0.370 test_accuracy: 0.357\n",
            "[3,   360] train_loss: 1.897 train_accuracy: 0.377 test_accuracy: 0.365\n",
            "[3,   365] train_loss: 1.938 train_accuracy: 0.379 test_accuracy: 0.367\n",
            "[3,   370] train_loss: 1.684 train_accuracy: 0.373 test_accuracy: 0.358\n",
            "[3,   375] train_loss: 1.970 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[3,   380] train_loss: 1.821 train_accuracy: 0.381 test_accuracy: 0.365\n",
            "[3,   385] train_loss: 1.808 train_accuracy: 0.391 test_accuracy: 0.378\n",
            "[3,   390] train_loss: 1.709 train_accuracy: 0.386 test_accuracy: 0.372\n",
            "[3,   395] train_loss: 1.750 train_accuracy: 0.385 test_accuracy: 0.371\n",
            "[3,   400] train_loss: 1.772 train_accuracy: 0.389 test_accuracy: 0.373\n",
            "[3,   405] train_loss: 1.720 train_accuracy: 0.382 test_accuracy: 0.371\n",
            "[3,   410] train_loss: 1.713 train_accuracy: 0.389 test_accuracy: 0.381\n",
            "[3,   415] train_loss: 1.689 train_accuracy: 0.390 test_accuracy: 0.381\n",
            "[3,   420] train_loss: 1.723 train_accuracy: 0.389 test_accuracy: 0.382\n",
            "[3,   425] train_loss: 1.759 train_accuracy: 0.389 test_accuracy: 0.378\n",
            "[3,   430] train_loss: 1.862 train_accuracy: 0.376 test_accuracy: 0.355\n",
            "[3,   435] train_loss: 1.776 train_accuracy: 0.384 test_accuracy: 0.362\n",
            "[3,   440] train_loss: 1.686 train_accuracy: 0.389 test_accuracy: 0.362\n",
            "[3,   445] train_loss: 1.743 train_accuracy: 0.379 test_accuracy: 0.355\n",
            "[3,   450] train_loss: 1.812 train_accuracy: 0.384 test_accuracy: 0.370\n",
            "[3,   455] train_loss: 1.850 train_accuracy: 0.380 test_accuracy: 0.374\n",
            "[3,   460] train_loss: 1.757 train_accuracy: 0.385 test_accuracy: 0.378\n",
            "[3,   465] train_loss: 1.736 train_accuracy: 0.395 test_accuracy: 0.380\n",
            "[3,   470] train_loss: 1.700 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[3,   475] train_loss: 1.903 train_accuracy: 0.391 test_accuracy: 0.382\n",
            "[3,   480] train_loss: 1.769 train_accuracy: 0.372 test_accuracy: 0.368\n",
            "[3,   485] train_loss: 1.748 train_accuracy: 0.357 test_accuracy: 0.353\n",
            "[3,   490] train_loss: 1.744 train_accuracy: 0.373 test_accuracy: 0.363\n",
            "[3,   495] train_loss: 1.796 train_accuracy: 0.394 test_accuracy: 0.374\n",
            "[3,   500] train_loss: 1.708 train_accuracy: 0.378 test_accuracy: 0.354\n",
            "[3,   505] train_loss: 1.845 train_accuracy: 0.392 test_accuracy: 0.363\n",
            "[3,   510] train_loss: 1.857 train_accuracy: 0.394 test_accuracy: 0.372\n",
            "[3,   515] train_loss: 1.622 train_accuracy: 0.379 test_accuracy: 0.371\n",
            "[3,   520] train_loss: 1.832 train_accuracy: 0.385 test_accuracy: 0.380\n",
            "[3,   525] train_loss: 1.715 train_accuracy: 0.386 test_accuracy: 0.374\n",
            "[3,   530] train_loss: 1.880 train_accuracy: 0.401 test_accuracy: 0.383\n",
            "[3,   535] train_loss: 1.770 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[3,   540] train_loss: 1.815 train_accuracy: 0.386 test_accuracy: 0.373\n",
            "[3,   545] train_loss: 1.826 train_accuracy: 0.376 test_accuracy: 0.365\n",
            "[3,   550] train_loss: 1.981 train_accuracy: 0.390 test_accuracy: 0.377\n",
            "[3,   555] train_loss: 1.756 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[3,   560] train_loss: 1.794 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[3,   565] train_loss: 1.835 train_accuracy: 0.392 test_accuracy: 0.383\n",
            "[3,   570] train_loss: 1.824 train_accuracy: 0.391 test_accuracy: 0.377\n",
            "[3,   575] train_loss: 1.764 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[3,   580] train_loss: 1.802 train_accuracy: 0.391 test_accuracy: 0.373\n",
            "[3,   585] train_loss: 1.722 train_accuracy: 0.393 test_accuracy: 0.379\n",
            "[3,   590] train_loss: 1.701 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[3,   595] train_loss: 1.705 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[3,   600] train_loss: 1.801 train_accuracy: 0.393 test_accuracy: 0.381\n",
            "[3,   605] train_loss: 1.804 train_accuracy: 0.392 test_accuracy: 0.379\n",
            "[3,   610] train_loss: 1.710 train_accuracy: 0.378 test_accuracy: 0.368\n",
            "[3,   615] train_loss: 1.831 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[3,   620] train_loss: 1.809 train_accuracy: 0.388 test_accuracy: 0.373\n",
            "[3,   625] train_loss: 1.794 train_accuracy: 0.392 test_accuracy: 0.370\n",
            "[3,   630] train_loss: 1.717 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[3,   635] train_loss: 1.936 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[3,   640] train_loss: 1.771 train_accuracy: 0.382 test_accuracy: 0.364\n",
            "[3,   645] train_loss: 1.862 train_accuracy: 0.393 test_accuracy: 0.371\n",
            "[3,   650] train_loss: 1.773 train_accuracy: 0.394 test_accuracy: 0.373\n",
            "[3,   655] train_loss: 1.624 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[3,   660] train_loss: 1.708 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[3,   665] train_loss: 1.637 train_accuracy: 0.384 test_accuracy: 0.374\n",
            "[3,   670] train_loss: 1.814 train_accuracy: 0.377 test_accuracy: 0.364\n",
            "[3,   675] train_loss: 1.853 train_accuracy: 0.389 test_accuracy: 0.366\n",
            "[3,   680] train_loss: 1.822 train_accuracy: 0.393 test_accuracy: 0.373\n",
            "[3,   685] train_loss: 1.725 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[3,   690] train_loss: 1.761 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[3,   695] train_loss: 1.824 train_accuracy: 0.392 test_accuracy: 0.371\n",
            "[3,   700] train_loss: 1.822 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,   705] train_loss: 1.803 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[3,   710] train_loss: 1.701 train_accuracy: 0.375 test_accuracy: 0.355\n",
            "[3,   715] train_loss: 1.790 train_accuracy: 0.396 test_accuracy: 0.375\n",
            "[3,   720] train_loss: 1.870 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[3,   725] train_loss: 1.866 train_accuracy: 0.395 test_accuracy: 0.381\n",
            "[3,   730] train_loss: 1.711 train_accuracy: 0.383 test_accuracy: 0.369\n",
            "[3,   735] train_loss: 1.822 train_accuracy: 0.374 test_accuracy: 0.357\n",
            "[3,   740] train_loss: 1.873 train_accuracy: 0.404 test_accuracy: 0.380\n",
            "[3,   745] train_loss: 1.807 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[3,   750] train_loss: 1.772 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[3,   755] train_loss: 1.806 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[3,   760] train_loss: 1.619 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[3,   765] train_loss: 1.705 train_accuracy: 0.382 test_accuracy: 0.366\n",
            "[3,   770] train_loss: 1.715 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[3,   775] train_loss: 1.798 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[3,   780] train_loss: 1.625 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[3,   785] train_loss: 1.849 train_accuracy: 0.392 test_accuracy: 0.377\n",
            "[3,   790] train_loss: 1.716 train_accuracy: 0.402 test_accuracy: 0.375\n",
            "[3,   795] train_loss: 1.719 train_accuracy: 0.402 test_accuracy: 0.375\n",
            "[3,   800] train_loss: 1.815 train_accuracy: 0.391 test_accuracy: 0.370\n",
            "[3,   805] train_loss: 1.905 train_accuracy: 0.391 test_accuracy: 0.367\n",
            "[3,   810] train_loss: 1.738 train_accuracy: 0.382 test_accuracy: 0.364\n",
            "[3,   815] train_loss: 1.686 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[3,   820] train_loss: 1.653 train_accuracy: 0.391 test_accuracy: 0.370\n",
            "[3,   825] train_loss: 1.829 train_accuracy: 0.386 test_accuracy: 0.365\n",
            "[3,   830] train_loss: 1.676 train_accuracy: 0.381 test_accuracy: 0.358\n",
            "[3,   835] train_loss: 1.920 train_accuracy: 0.397 test_accuracy: 0.374\n",
            "[3,   840] train_loss: 1.723 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[3,   845] train_loss: 1.761 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[3,   850] train_loss: 1.803 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[3,   855] train_loss: 1.863 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[3,   860] train_loss: 1.734 train_accuracy: 0.395 test_accuracy: 0.371\n",
            "[3,   865] train_loss: 1.820 train_accuracy: 0.402 test_accuracy: 0.382\n",
            "[3,   870] train_loss: 1.775 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[3,   875] train_loss: 1.732 train_accuracy: 0.391 test_accuracy: 0.369\n",
            "[3,   880] train_loss: 1.825 train_accuracy: 0.391 test_accuracy: 0.367\n",
            "[3,   885] train_loss: 1.748 train_accuracy: 0.391 test_accuracy: 0.371\n",
            "[3,   890] train_loss: 1.768 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,   895] train_loss: 1.853 train_accuracy: 0.385 test_accuracy: 0.375\n",
            "[3,   900] train_loss: 1.842 train_accuracy: 0.379 test_accuracy: 0.363\n",
            "[3,   905] train_loss: 1.829 train_accuracy: 0.381 test_accuracy: 0.367\n",
            "[3,   910] train_loss: 1.822 train_accuracy: 0.383 test_accuracy: 0.366\n",
            "[3,   915] train_loss: 1.949 train_accuracy: 0.373 test_accuracy: 0.359\n",
            "[3,   920] train_loss: 1.719 train_accuracy: 0.380 test_accuracy: 0.364\n",
            "[3,   925] train_loss: 1.820 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[3,   930] train_loss: 1.869 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[3,   935] train_loss: 1.749 train_accuracy: 0.380 test_accuracy: 0.371\n",
            "[3,   940] train_loss: 1.811 train_accuracy: 0.378 test_accuracy: 0.365\n",
            "[3,   945] train_loss: 1.765 train_accuracy: 0.394 test_accuracy: 0.375\n",
            "[3,   950] train_loss: 1.863 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[3,   955] train_loss: 1.738 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[3,   960] train_loss: 1.734 train_accuracy: 0.395 test_accuracy: 0.376\n",
            "[3,   965] train_loss: 1.757 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[3,   970] train_loss: 1.548 train_accuracy: 0.385 test_accuracy: 0.373\n",
            "[3,   975] train_loss: 1.613 train_accuracy: 0.389 test_accuracy: 0.379\n",
            "[3,   980] train_loss: 1.806 train_accuracy: 0.403 test_accuracy: 0.384\n",
            "[3,   985] train_loss: 1.733 train_accuracy: 0.394 test_accuracy: 0.374\n",
            "[3,   990] train_loss: 1.789 train_accuracy: 0.405 test_accuracy: 0.395\n",
            "[3,   995] train_loss: 1.733 train_accuracy: 0.397 test_accuracy: 0.391\n",
            "[3,  1000] train_loss: 1.749 train_accuracy: 0.396 test_accuracy: 0.385\n",
            "[3,  1005] train_loss: 1.678 train_accuracy: 0.386 test_accuracy: 0.366\n",
            "[3,  1010] train_loss: 1.807 train_accuracy: 0.376 test_accuracy: 0.356\n",
            "[3,  1015] train_loss: 1.736 train_accuracy: 0.399 test_accuracy: 0.384\n",
            "[3,  1020] train_loss: 1.808 train_accuracy: 0.400 test_accuracy: 0.387\n",
            "[3,  1025] train_loss: 1.875 train_accuracy: 0.388 test_accuracy: 0.376\n",
            "[3,  1030] train_loss: 1.705 train_accuracy: 0.384 test_accuracy: 0.369\n",
            "[3,  1035] train_loss: 1.708 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[3,  1040] train_loss: 1.784 train_accuracy: 0.398 test_accuracy: 0.380\n",
            "[3,  1045] train_loss: 1.791 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[3,  1050] train_loss: 1.833 train_accuracy: 0.393 test_accuracy: 0.382\n",
            "[3,  1055] train_loss: 1.677 train_accuracy: 0.385 test_accuracy: 0.365\n",
            "[3,  1060] train_loss: 1.827 train_accuracy: 0.379 test_accuracy: 0.367\n",
            "[3,  1065] train_loss: 1.712 train_accuracy: 0.389 test_accuracy: 0.376\n",
            "[3,  1070] train_loss: 1.807 train_accuracy: 0.394 test_accuracy: 0.383\n",
            "[3,  1075] train_loss: 1.726 train_accuracy: 0.376 test_accuracy: 0.367\n",
            "[3,  1080] train_loss: 1.828 train_accuracy: 0.393 test_accuracy: 0.383\n",
            "[3,  1085] train_loss: 1.832 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[3,  1090] train_loss: 1.691 train_accuracy: 0.388 test_accuracy: 0.378\n",
            "[3,  1095] train_loss: 1.745 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[3,  1100] train_loss: 1.693 train_accuracy: 0.395 test_accuracy: 0.376\n",
            "[3,  1105] train_loss: 1.845 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[3,  1110] train_loss: 1.682 train_accuracy: 0.388 test_accuracy: 0.371\n",
            "[3,  1115] train_loss: 1.774 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[3,  1120] train_loss: 1.925 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[3,  1125] train_loss: 1.844 train_accuracy: 0.387 test_accuracy: 0.367\n",
            "[3,  1130] train_loss: 1.860 train_accuracy: 0.382 test_accuracy: 0.364\n",
            "[3,  1135] train_loss: 1.783 train_accuracy: 0.387 test_accuracy: 0.372\n",
            "[3,  1140] train_loss: 1.767 train_accuracy: 0.393 test_accuracy: 0.382\n",
            "[3,  1145] train_loss: 1.724 train_accuracy: 0.390 test_accuracy: 0.376\n",
            "[3,  1150] train_loss: 1.696 train_accuracy: 0.392 test_accuracy: 0.368\n",
            "[3,  1155] train_loss: 1.777 train_accuracy: 0.376 test_accuracy: 0.354\n",
            "[3,  1160] train_loss: 1.763 train_accuracy: 0.387 test_accuracy: 0.361\n",
            "[3,  1165] train_loss: 1.770 train_accuracy: 0.380 test_accuracy: 0.353\n",
            "[3,  1170] train_loss: 1.723 train_accuracy: 0.395 test_accuracy: 0.374\n",
            "[3,  1175] train_loss: 1.821 train_accuracy: 0.386 test_accuracy: 0.371\n",
            "[3,  1180] train_loss: 1.784 train_accuracy: 0.385 test_accuracy: 0.376\n",
            "[3,  1185] train_loss: 1.930 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[3,  1190] train_loss: 1.750 train_accuracy: 0.385 test_accuracy: 0.369\n",
            "[3,  1195] train_loss: 1.802 train_accuracy: 0.398 test_accuracy: 0.379\n",
            "[3,  1200] train_loss: 1.705 train_accuracy: 0.396 test_accuracy: 0.376\n",
            "[3,  1205] train_loss: 1.837 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[3,  1210] train_loss: 1.770 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[3,  1215] train_loss: 1.760 train_accuracy: 0.403 test_accuracy: 0.386\n",
            "[3,  1220] train_loss: 1.745 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[3,  1225] train_loss: 1.826 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[3,  1230] train_loss: 1.901 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[3,  1235] train_loss: 1.795 train_accuracy: 0.387 test_accuracy: 0.365\n",
            "[3,  1240] train_loss: 1.826 train_accuracy: 0.398 test_accuracy: 0.369\n",
            "[3,  1245] train_loss: 1.729 train_accuracy: 0.396 test_accuracy: 0.371\n",
            "[4,     5] train_loss: 1.724 train_accuracy: 0.380 test_accuracy: 0.367\n",
            "[4,    10] train_loss: 1.751 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[4,    15] train_loss: 1.844 train_accuracy: 0.397 test_accuracy: 0.372\n",
            "[4,    20] train_loss: 1.679 train_accuracy: 0.383 test_accuracy: 0.370\n",
            "[4,    25] train_loss: 1.747 train_accuracy: 0.382 test_accuracy: 0.373\n",
            "[4,    30] train_loss: 1.702 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[4,    35] train_loss: 1.676 train_accuracy: 0.388 test_accuracy: 0.370\n",
            "[4,    40] train_loss: 1.652 train_accuracy: 0.384 test_accuracy: 0.366\n",
            "[4,    45] train_loss: 1.701 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[4,    50] train_loss: 1.635 train_accuracy: 0.397 test_accuracy: 0.382\n",
            "[4,    55] train_loss: 1.776 train_accuracy: 0.387 test_accuracy: 0.374\n",
            "[4,    60] train_loss: 1.806 train_accuracy: 0.387 test_accuracy: 0.364\n",
            "[4,    65] train_loss: 1.745 train_accuracy: 0.385 test_accuracy: 0.368\n",
            "[4,    70] train_loss: 1.834 train_accuracy: 0.381 test_accuracy: 0.369\n",
            "[4,    75] train_loss: 1.751 train_accuracy: 0.365 test_accuracy: 0.354\n",
            "[4,    80] train_loss: 1.647 train_accuracy: 0.379 test_accuracy: 0.368\n",
            "[4,    85] train_loss: 1.808 train_accuracy: 0.396 test_accuracy: 0.382\n",
            "[4,    90] train_loss: 1.616 train_accuracy: 0.387 test_accuracy: 0.376\n",
            "[4,    95] train_loss: 1.629 train_accuracy: 0.383 test_accuracy: 0.371\n",
            "[4,   100] train_loss: 1.797 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[4,   105] train_loss: 1.767 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[4,   110] train_loss: 1.831 train_accuracy: 0.406 test_accuracy: 0.381\n",
            "[4,   115] train_loss: 1.760 train_accuracy: 0.402 test_accuracy: 0.381\n",
            "[4,   120] train_loss: 1.632 train_accuracy: 0.401 test_accuracy: 0.386\n",
            "[4,   125] train_loss: 1.629 train_accuracy: 0.393 test_accuracy: 0.382\n",
            "[4,   130] train_loss: 1.718 train_accuracy: 0.397 test_accuracy: 0.383\n",
            "[4,   135] train_loss: 1.804 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[4,   140] train_loss: 1.873 train_accuracy: 0.389 test_accuracy: 0.370\n",
            "[4,   145] train_loss: 1.732 train_accuracy: 0.393 test_accuracy: 0.372\n",
            "[4,   150] train_loss: 1.693 train_accuracy: 0.390 test_accuracy: 0.371\n",
            "[4,   155] train_loss: 1.740 train_accuracy: 0.385 test_accuracy: 0.373\n",
            "[4,   160] train_loss: 1.753 train_accuracy: 0.402 test_accuracy: 0.382\n",
            "[4,   165] train_loss: 1.700 train_accuracy: 0.404 test_accuracy: 0.380\n",
            "[4,   170] train_loss: 1.797 train_accuracy: 0.396 test_accuracy: 0.372\n",
            "[4,   175] train_loss: 1.799 train_accuracy: 0.397 test_accuracy: 0.370\n",
            "[4,   180] train_loss: 1.692 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[4,   185] train_loss: 1.729 train_accuracy: 0.400 test_accuracy: 0.384\n",
            "[4,   190] train_loss: 1.786 train_accuracy: 0.400 test_accuracy: 0.383\n",
            "[4,   195] train_loss: 1.745 train_accuracy: 0.405 test_accuracy: 0.384\n",
            "[4,   200] train_loss: 1.823 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[4,   205] train_loss: 1.731 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[4,   210] train_loss: 1.740 train_accuracy: 0.392 test_accuracy: 0.376\n",
            "[4,   215] train_loss: 1.673 train_accuracy: 0.379 test_accuracy: 0.363\n",
            "[4,   220] train_loss: 1.742 train_accuracy: 0.383 test_accuracy: 0.366\n",
            "[4,   225] train_loss: 1.833 train_accuracy: 0.396 test_accuracy: 0.379\n",
            "[4,   230] train_loss: 1.862 train_accuracy: 0.378 test_accuracy: 0.369\n",
            "[4,   235] train_loss: 1.722 train_accuracy: 0.378 test_accuracy: 0.362\n",
            "[4,   240] train_loss: 1.779 train_accuracy: 0.390 test_accuracy: 0.373\n",
            "[4,   245] train_loss: 1.724 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[4,   250] train_loss: 1.670 train_accuracy: 0.408 test_accuracy: 0.382\n",
            "[4,   255] train_loss: 1.756 train_accuracy: 0.398 test_accuracy: 0.374\n",
            "[4,   260] train_loss: 1.773 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[4,   265] train_loss: 1.683 train_accuracy: 0.404 test_accuracy: 0.375\n",
            "[4,   270] train_loss: 1.909 train_accuracy: 0.410 test_accuracy: 0.382\n",
            "[4,   275] train_loss: 1.821 train_accuracy: 0.407 test_accuracy: 0.378\n",
            "[4,   280] train_loss: 1.620 train_accuracy: 0.406 test_accuracy: 0.378\n",
            "[4,   285] train_loss: 1.682 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[4,   290] train_loss: 1.712 train_accuracy: 0.383 test_accuracy: 0.369\n",
            "[4,   295] train_loss: 1.781 train_accuracy: 0.378 test_accuracy: 0.365\n",
            "[4,   300] train_loss: 1.770 train_accuracy: 0.392 test_accuracy: 0.371\n",
            "[4,   305] train_loss: 1.803 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[4,   310] train_loss: 1.867 train_accuracy: 0.381 test_accuracy: 0.366\n",
            "[4,   315] train_loss: 1.729 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[4,   320] train_loss: 1.777 train_accuracy: 0.398 test_accuracy: 0.375\n",
            "[4,   325] train_loss: 1.852 train_accuracy: 0.395 test_accuracy: 0.371\n",
            "[4,   330] train_loss: 1.646 train_accuracy: 0.395 test_accuracy: 0.377\n",
            "[4,   335] train_loss: 1.754 train_accuracy: 0.404 test_accuracy: 0.379\n",
            "[4,   340] train_loss: 1.710 train_accuracy: 0.408 test_accuracy: 0.383\n",
            "[4,   345] train_loss: 1.711 train_accuracy: 0.408 test_accuracy: 0.386\n",
            "[4,   350] train_loss: 1.801 train_accuracy: 0.402 test_accuracy: 0.381\n",
            "[4,   355] train_loss: 1.827 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[4,   360] train_loss: 1.756 train_accuracy: 0.396 test_accuracy: 0.368\n",
            "[4,   365] train_loss: 1.666 train_accuracy: 0.392 test_accuracy: 0.370\n",
            "[4,   370] train_loss: 1.862 train_accuracy: 0.384 test_accuracy: 0.368\n",
            "[4,   375] train_loss: 1.739 train_accuracy: 0.389 test_accuracy: 0.369\n",
            "[4,   380] train_loss: 1.746 train_accuracy: 0.398 test_accuracy: 0.374\n",
            "[4,   385] train_loss: 1.741 train_accuracy: 0.394 test_accuracy: 0.372\n",
            "[4,   390] train_loss: 1.710 train_accuracy: 0.388 test_accuracy: 0.371\n",
            "[4,   395] train_loss: 1.908 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[4,   400] train_loss: 1.595 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[4,   405] train_loss: 1.855 train_accuracy: 0.391 test_accuracy: 0.371\n",
            "[4,   410] train_loss: 1.835 train_accuracy: 0.407 test_accuracy: 0.385\n",
            "[4,   415] train_loss: 1.656 train_accuracy: 0.407 test_accuracy: 0.382\n",
            "[4,   420] train_loss: 1.747 train_accuracy: 0.394 test_accuracy: 0.378\n",
            "[4,   425] train_loss: 1.803 train_accuracy: 0.392 test_accuracy: 0.377\n",
            "[4,   430] train_loss: 1.769 train_accuracy: 0.399 test_accuracy: 0.383\n",
            "[4,   435] train_loss: 1.630 train_accuracy: 0.402 test_accuracy: 0.383\n",
            "[4,   440] train_loss: 1.693 train_accuracy: 0.396 test_accuracy: 0.374\n",
            "[4,   445] train_loss: 1.870 train_accuracy: 0.395 test_accuracy: 0.371\n",
            "[4,   450] train_loss: 1.740 train_accuracy: 0.383 test_accuracy: 0.363\n",
            "[4,   455] train_loss: 1.828 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[4,   460] train_loss: 1.847 train_accuracy: 0.397 test_accuracy: 0.372\n",
            "[4,   465] train_loss: 1.872 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[4,   470] train_loss: 1.734 train_accuracy: 0.406 test_accuracy: 0.380\n",
            "[4,   475] train_loss: 1.817 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[4,   480] train_loss: 1.762 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[4,   485] train_loss: 1.643 train_accuracy: 0.405 test_accuracy: 0.385\n",
            "[4,   490] train_loss: 1.798 train_accuracy: 0.400 test_accuracy: 0.382\n",
            "[4,   495] train_loss: 1.712 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[4,   500] train_loss: 1.833 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[4,   505] train_loss: 1.787 train_accuracy: 0.400 test_accuracy: 0.379\n",
            "[4,   510] train_loss: 1.676 train_accuracy: 0.396 test_accuracy: 0.381\n",
            "[4,   515] train_loss: 1.855 train_accuracy: 0.396 test_accuracy: 0.383\n",
            "[4,   520] train_loss: 1.837 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[4,   525] train_loss: 1.822 train_accuracy: 0.401 test_accuracy: 0.377\n",
            "[4,   530] train_loss: 1.754 train_accuracy: 0.403 test_accuracy: 0.374\n",
            "[4,   535] train_loss: 1.850 train_accuracy: 0.402 test_accuracy: 0.373\n",
            "[4,   540] train_loss: 1.677 train_accuracy: 0.396 test_accuracy: 0.372\n",
            "[4,   545] train_loss: 1.770 train_accuracy: 0.402 test_accuracy: 0.374\n",
            "[4,   550] train_loss: 1.660 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[4,   555] train_loss: 1.717 train_accuracy: 0.396 test_accuracy: 0.371\n",
            "[4,   560] train_loss: 1.845 train_accuracy: 0.386 test_accuracy: 0.360\n",
            "[4,   565] train_loss: 1.785 train_accuracy: 0.393 test_accuracy: 0.377\n",
            "[4,   570] train_loss: 1.773 train_accuracy: 0.397 test_accuracy: 0.379\n",
            "[4,   575] train_loss: 1.680 train_accuracy: 0.392 test_accuracy: 0.369\n",
            "[4,   580] train_loss: 1.611 train_accuracy: 0.391 test_accuracy: 0.370\n",
            "[4,   585] train_loss: 1.789 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[4,   590] train_loss: 1.709 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[4,   595] train_loss: 1.661 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[4,   600] train_loss: 1.768 train_accuracy: 0.400 test_accuracy: 0.377\n",
            "[4,   605] train_loss: 1.740 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[4,   610] train_loss: 1.733 train_accuracy: 0.396 test_accuracy: 0.369\n",
            "[4,   615] train_loss: 1.814 train_accuracy: 0.399 test_accuracy: 0.374\n",
            "[4,   620] train_loss: 1.860 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[4,   625] train_loss: 1.767 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[4,   630] train_loss: 1.842 train_accuracy: 0.396 test_accuracy: 0.375\n",
            "[4,   635] train_loss: 1.693 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,   640] train_loss: 1.808 train_accuracy: 0.395 test_accuracy: 0.376\n",
            "[4,   645] train_loss: 1.820 train_accuracy: 0.380 test_accuracy: 0.365\n",
            "[4,   650] train_loss: 1.741 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[4,   655] train_loss: 1.726 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[4,   660] train_loss: 1.877 train_accuracy: 0.382 test_accuracy: 0.366\n",
            "[4,   665] train_loss: 1.749 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[4,   670] train_loss: 1.889 train_accuracy: 0.405 test_accuracy: 0.378\n",
            "[4,   675] train_loss: 1.822 train_accuracy: 0.390 test_accuracy: 0.370\n",
            "[4,   680] train_loss: 1.650 train_accuracy: 0.396 test_accuracy: 0.372\n",
            "[4,   685] train_loss: 1.812 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[4,   690] train_loss: 1.813 train_accuracy: 0.402 test_accuracy: 0.377\n",
            "[4,   695] train_loss: 1.827 train_accuracy: 0.403 test_accuracy: 0.385\n",
            "[4,   700] train_loss: 1.670 train_accuracy: 0.396 test_accuracy: 0.385\n",
            "[4,   705] train_loss: 1.848 train_accuracy: 0.388 test_accuracy: 0.381\n",
            "[4,   710] train_loss: 1.824 train_accuracy: 0.381 test_accuracy: 0.371\n",
            "[4,   715] train_loss: 1.738 train_accuracy: 0.394 test_accuracy: 0.375\n",
            "[4,   720] train_loss: 1.737 train_accuracy: 0.395 test_accuracy: 0.367\n",
            "[4,   725] train_loss: 1.790 train_accuracy: 0.401 test_accuracy: 0.372\n",
            "[4,   730] train_loss: 1.750 train_accuracy: 0.397 test_accuracy: 0.370\n",
            "[4,   735] train_loss: 1.767 train_accuracy: 0.401 test_accuracy: 0.374\n",
            "[4,   740] train_loss: 1.603 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[4,   745] train_loss: 1.793 train_accuracy: 0.399 test_accuracy: 0.371\n",
            "[4,   750] train_loss: 1.849 train_accuracy: 0.391 test_accuracy: 0.363\n",
            "[4,   755] train_loss: 1.734 train_accuracy: 0.398 test_accuracy: 0.368\n",
            "[4,   760] train_loss: 1.887 train_accuracy: 0.405 test_accuracy: 0.380\n",
            "[4,   765] train_loss: 1.871 train_accuracy: 0.393 test_accuracy: 0.378\n",
            "[4,   770] train_loss: 1.771 train_accuracy: 0.398 test_accuracy: 0.383\n",
            "[4,   775] train_loss: 1.680 train_accuracy: 0.400 test_accuracy: 0.383\n",
            "[4,   780] train_loss: 1.795 train_accuracy: 0.387 test_accuracy: 0.374\n",
            "[4,   785] train_loss: 1.684 train_accuracy: 0.396 test_accuracy: 0.384\n",
            "[4,   790] train_loss: 1.656 train_accuracy: 0.382 test_accuracy: 0.363\n",
            "[4,   795] train_loss: 1.754 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[4,   800] train_loss: 1.853 train_accuracy: 0.401 test_accuracy: 0.382\n",
            "[4,   805] train_loss: 1.835 train_accuracy: 0.398 test_accuracy: 0.382\n",
            "[4,   810] train_loss: 1.719 train_accuracy: 0.400 test_accuracy: 0.390\n",
            "[4,   815] train_loss: 1.652 train_accuracy: 0.403 test_accuracy: 0.386\n",
            "[4,   820] train_loss: 1.869 train_accuracy: 0.399 test_accuracy: 0.374\n",
            "[4,   825] train_loss: 1.837 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[4,   830] train_loss: 1.659 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[4,   835] train_loss: 1.787 train_accuracy: 0.382 test_accuracy: 0.367\n",
            "[4,   840] train_loss: 1.839 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,   845] train_loss: 1.738 train_accuracy: 0.392 test_accuracy: 0.381\n",
            "[4,   850] train_loss: 1.776 train_accuracy: 0.406 test_accuracy: 0.381\n",
            "[4,   855] train_loss: 1.715 train_accuracy: 0.392 test_accuracy: 0.366\n",
            "[4,   860] train_loss: 1.883 train_accuracy: 0.402 test_accuracy: 0.376\n",
            "[4,   865] train_loss: 1.845 train_accuracy: 0.390 test_accuracy: 0.369\n",
            "[4,   870] train_loss: 1.745 train_accuracy: 0.391 test_accuracy: 0.363\n",
            "[4,   875] train_loss: 1.696 train_accuracy: 0.394 test_accuracy: 0.373\n",
            "[4,   880] train_loss: 1.840 train_accuracy: 0.382 test_accuracy: 0.366\n",
            "[4,   885] train_loss: 1.738 train_accuracy: 0.380 test_accuracy: 0.370\n",
            "[4,   890] train_loss: 1.775 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[4,   895] train_loss: 1.750 train_accuracy: 0.403 test_accuracy: 0.386\n",
            "[4,   900] train_loss: 1.866 train_accuracy: 0.392 test_accuracy: 0.379\n",
            "[4,   905] train_loss: 1.698 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[4,   910] train_loss: 1.736 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[4,   915] train_loss: 1.718 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[4,   920] train_loss: 1.733 train_accuracy: 0.383 test_accuracy: 0.374\n",
            "[4,   925] train_loss: 1.667 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[4,   930] train_loss: 1.883 train_accuracy: 0.405 test_accuracy: 0.384\n",
            "[4,   935] train_loss: 1.725 train_accuracy: 0.405 test_accuracy: 0.389\n",
            "[4,   940] train_loss: 1.704 train_accuracy: 0.412 test_accuracy: 0.395\n",
            "[4,   945] train_loss: 1.760 train_accuracy: 0.409 test_accuracy: 0.390\n",
            "[4,   950] train_loss: 1.819 train_accuracy: 0.403 test_accuracy: 0.379\n",
            "[4,   955] train_loss: 1.760 train_accuracy: 0.399 test_accuracy: 0.377\n",
            "[4,   960] train_loss: 1.666 train_accuracy: 0.406 test_accuracy: 0.375\n",
            "[4,   965] train_loss: 1.704 train_accuracy: 0.405 test_accuracy: 0.380\n",
            "[4,   970] train_loss: 1.814 train_accuracy: 0.401 test_accuracy: 0.375\n",
            "[4,   975] train_loss: 1.727 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[4,   980] train_loss: 1.905 train_accuracy: 0.395 test_accuracy: 0.376\n",
            "[4,   985] train_loss: 1.797 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[4,   990] train_loss: 1.717 train_accuracy: 0.379 test_accuracy: 0.364\n",
            "[4,   995] train_loss: 1.787 train_accuracy: 0.389 test_accuracy: 0.372\n",
            "[4,  1000] train_loss: 1.845 train_accuracy: 0.393 test_accuracy: 0.375\n",
            "[4,  1005] train_loss: 1.809 train_accuracy: 0.381 test_accuracy: 0.365\n",
            "[4,  1010] train_loss: 1.706 train_accuracy: 0.378 test_accuracy: 0.367\n",
            "[4,  1015] train_loss: 1.731 train_accuracy: 0.387 test_accuracy: 0.371\n",
            "[4,  1020] train_loss: 1.647 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,  1025] train_loss: 1.746 train_accuracy: 0.392 test_accuracy: 0.374\n",
            "[4,  1030] train_loss: 1.772 train_accuracy: 0.399 test_accuracy: 0.382\n",
            "[4,  1035] train_loss: 1.732 train_accuracy: 0.400 test_accuracy: 0.387\n",
            "[4,  1040] train_loss: 1.786 train_accuracy: 0.399 test_accuracy: 0.384\n",
            "[4,  1045] train_loss: 1.742 train_accuracy: 0.398 test_accuracy: 0.382\n",
            "[4,  1050] train_loss: 1.778 train_accuracy: 0.398 test_accuracy: 0.378\n",
            "[4,  1055] train_loss: 1.741 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[4,  1060] train_loss: 1.793 train_accuracy: 0.384 test_accuracy: 0.372\n",
            "[4,  1065] train_loss: 1.760 train_accuracy: 0.397 test_accuracy: 0.381\n",
            "[4,  1070] train_loss: 1.758 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[4,  1075] train_loss: 1.739 train_accuracy: 0.393 test_accuracy: 0.380\n",
            "[4,  1080] train_loss: 1.674 train_accuracy: 0.401 test_accuracy: 0.384\n",
            "[4,  1085] train_loss: 1.711 train_accuracy: 0.418 test_accuracy: 0.390\n",
            "[4,  1090] train_loss: 1.680 train_accuracy: 0.401 test_accuracy: 0.383\n",
            "[4,  1095] train_loss: 1.804 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[4,  1100] train_loss: 1.734 train_accuracy: 0.403 test_accuracy: 0.386\n",
            "[4,  1105] train_loss: 1.782 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[4,  1110] train_loss: 1.838 train_accuracy: 0.376 test_accuracy: 0.355\n",
            "[4,  1115] train_loss: 1.922 train_accuracy: 0.389 test_accuracy: 0.372\n",
            "[4,  1120] train_loss: 1.773 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[4,  1125] train_loss: 1.776 train_accuracy: 0.393 test_accuracy: 0.376\n",
            "[4,  1130] train_loss: 1.681 train_accuracy: 0.387 test_accuracy: 0.374\n",
            "[4,  1135] train_loss: 1.770 train_accuracy: 0.394 test_accuracy: 0.380\n",
            "[4,  1140] train_loss: 1.689 train_accuracy: 0.393 test_accuracy: 0.374\n",
            "[4,  1145] train_loss: 1.830 train_accuracy: 0.380 test_accuracy: 0.364\n",
            "[4,  1150] train_loss: 1.804 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[4,  1155] train_loss: 1.730 train_accuracy: 0.399 test_accuracy: 0.379\n",
            "[4,  1160] train_loss: 1.858 train_accuracy: 0.398 test_accuracy: 0.382\n",
            "[4,  1165] train_loss: 1.735 train_accuracy: 0.402 test_accuracy: 0.381\n",
            "[4,  1170] train_loss: 1.851 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[4,  1175] train_loss: 1.776 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[4,  1180] train_loss: 1.695 train_accuracy: 0.405 test_accuracy: 0.382\n",
            "[4,  1185] train_loss: 1.716 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[4,  1190] train_loss: 1.694 train_accuracy: 0.398 test_accuracy: 0.373\n",
            "[4,  1195] train_loss: 1.842 train_accuracy: 0.399 test_accuracy: 0.371\n",
            "[4,  1200] train_loss: 1.828 train_accuracy: 0.394 test_accuracy: 0.372\n",
            "[4,  1205] train_loss: 1.711 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[4,  1210] train_loss: 1.724 train_accuracy: 0.408 test_accuracy: 0.392\n",
            "[4,  1215] train_loss: 1.773 train_accuracy: 0.404 test_accuracy: 0.387\n",
            "[4,  1220] train_loss: 1.827 train_accuracy: 0.404 test_accuracy: 0.386\n",
            "[4,  1225] train_loss: 1.801 train_accuracy: 0.400 test_accuracy: 0.386\n",
            "[4,  1230] train_loss: 1.783 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[4,  1235] train_loss: 1.671 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[4,  1240] train_loss: 1.831 train_accuracy: 0.386 test_accuracy: 0.370\n",
            "[4,  1245] train_loss: 1.784 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[5,     5] train_loss: 1.836 train_accuracy: 0.392 test_accuracy: 0.369\n",
            "[5,    10] train_loss: 1.833 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[5,    15] train_loss: 1.741 train_accuracy: 0.397 test_accuracy: 0.378\n",
            "[5,    20] train_loss: 1.743 train_accuracy: 0.412 test_accuracy: 0.392\n",
            "[5,    25] train_loss: 1.645 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[5,    30] train_loss: 1.896 train_accuracy: 0.395 test_accuracy: 0.379\n",
            "[5,    35] train_loss: 1.730 train_accuracy: 0.395 test_accuracy: 0.375\n",
            "[5,    40] train_loss: 1.714 train_accuracy: 0.400 test_accuracy: 0.379\n",
            "[5,    45] train_loss: 1.787 train_accuracy: 0.401 test_accuracy: 0.376\n",
            "[5,    50] train_loss: 1.647 train_accuracy: 0.399 test_accuracy: 0.376\n",
            "[5,    55] train_loss: 1.767 train_accuracy: 0.408 test_accuracy: 0.383\n",
            "[5,    60] train_loss: 1.830 train_accuracy: 0.409 test_accuracy: 0.386\n",
            "[5,    65] train_loss: 1.659 train_accuracy: 0.415 test_accuracy: 0.389\n",
            "[5,    70] train_loss: 1.736 train_accuracy: 0.410 test_accuracy: 0.387\n",
            "[5,    75] train_loss: 1.694 train_accuracy: 0.406 test_accuracy: 0.383\n",
            "[5,    80] train_loss: 1.755 train_accuracy: 0.411 test_accuracy: 0.388\n",
            "[5,    85] train_loss: 1.684 train_accuracy: 0.402 test_accuracy: 0.387\n",
            "[5,    90] train_loss: 1.687 train_accuracy: 0.390 test_accuracy: 0.379\n",
            "[5,    95] train_loss: 1.668 train_accuracy: 0.392 test_accuracy: 0.379\n",
            "[5,   100] train_loss: 1.726 train_accuracy: 0.387 test_accuracy: 0.370\n",
            "[5,   105] train_loss: 1.754 train_accuracy: 0.389 test_accuracy: 0.373\n",
            "[5,   110] train_loss: 1.840 train_accuracy: 0.394 test_accuracy: 0.375\n",
            "[5,   115] train_loss: 1.646 train_accuracy: 0.394 test_accuracy: 0.375\n",
            "[5,   120] train_loss: 1.844 train_accuracy: 0.394 test_accuracy: 0.376\n",
            "[5,   125] train_loss: 1.733 train_accuracy: 0.401 test_accuracy: 0.377\n",
            "[5,   130] train_loss: 1.716 train_accuracy: 0.397 test_accuracy: 0.371\n",
            "[5,   135] train_loss: 1.740 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[5,   140] train_loss: 1.722 train_accuracy: 0.400 test_accuracy: 0.377\n",
            "[5,   145] train_loss: 1.878 train_accuracy: 0.402 test_accuracy: 0.374\n",
            "[5,   150] train_loss: 1.737 train_accuracy: 0.408 test_accuracy: 0.376\n",
            "[5,   155] train_loss: 1.745 train_accuracy: 0.407 test_accuracy: 0.383\n",
            "[5,   160] train_loss: 1.725 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[5,   165] train_loss: 1.745 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   170] train_loss: 1.758 train_accuracy: 0.402 test_accuracy: 0.383\n",
            "[5,   175] train_loss: 1.814 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[5,   180] train_loss: 1.704 train_accuracy: 0.392 test_accuracy: 0.374\n",
            "[5,   185] train_loss: 1.799 train_accuracy: 0.379 test_accuracy: 0.364\n",
            "[5,   190] train_loss: 1.711 train_accuracy: 0.387 test_accuracy: 0.375\n",
            "[5,   195] train_loss: 1.757 train_accuracy: 0.402 test_accuracy: 0.386\n",
            "[5,   200] train_loss: 1.645 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   205] train_loss: 1.848 train_accuracy: 0.396 test_accuracy: 0.383\n",
            "[5,   210] train_loss: 1.726 train_accuracy: 0.397 test_accuracy: 0.381\n",
            "[5,   215] train_loss: 1.821 train_accuracy: 0.390 test_accuracy: 0.376\n",
            "[5,   220] train_loss: 1.813 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[5,   225] train_loss: 1.833 train_accuracy: 0.398 test_accuracy: 0.373\n",
            "[5,   230] train_loss: 1.824 train_accuracy: 0.390 test_accuracy: 0.374\n",
            "[5,   235] train_loss: 1.856 train_accuracy: 0.388 test_accuracy: 0.369\n",
            "[5,   240] train_loss: 1.653 train_accuracy: 0.389 test_accuracy: 0.371\n",
            "[5,   245] train_loss: 1.726 train_accuracy: 0.387 test_accuracy: 0.367\n",
            "[5,   250] train_loss: 1.760 train_accuracy: 0.389 test_accuracy: 0.374\n",
            "[5,   255] train_loss: 1.706 train_accuracy: 0.398 test_accuracy: 0.388\n",
            "[5,   260] train_loss: 1.825 train_accuracy: 0.399 test_accuracy: 0.387\n",
            "[5,   265] train_loss: 1.706 train_accuracy: 0.407 test_accuracy: 0.389\n",
            "[5,   270] train_loss: 1.645 train_accuracy: 0.405 test_accuracy: 0.388\n",
            "[5,   275] train_loss: 1.737 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[5,   280] train_loss: 1.772 train_accuracy: 0.392 test_accuracy: 0.374\n",
            "[5,   285] train_loss: 1.831 train_accuracy: 0.397 test_accuracy: 0.380\n",
            "[5,   290] train_loss: 1.838 train_accuracy: 0.412 test_accuracy: 0.383\n",
            "[5,   295] train_loss: 1.724 train_accuracy: 0.403 test_accuracy: 0.379\n",
            "[5,   300] train_loss: 1.711 train_accuracy: 0.407 test_accuracy: 0.380\n",
            "[5,   305] train_loss: 1.784 train_accuracy: 0.398 test_accuracy: 0.381\n",
            "[5,   310] train_loss: 1.739 train_accuracy: 0.393 test_accuracy: 0.382\n",
            "[5,   315] train_loss: 1.730 train_accuracy: 0.388 test_accuracy: 0.377\n",
            "[5,   320] train_loss: 1.756 train_accuracy: 0.406 test_accuracy: 0.389\n",
            "[5,   325] train_loss: 1.703 train_accuracy: 0.407 test_accuracy: 0.390\n",
            "[5,   330] train_loss: 1.618 train_accuracy: 0.399 test_accuracy: 0.381\n",
            "[5,   335] train_loss: 1.838 train_accuracy: 0.396 test_accuracy: 0.377\n",
            "[5,   340] train_loss: 1.758 train_accuracy: 0.410 test_accuracy: 0.388\n",
            "[5,   345] train_loss: 1.739 train_accuracy: 0.408 test_accuracy: 0.387\n",
            "[5,   350] train_loss: 1.715 train_accuracy: 0.411 test_accuracy: 0.391\n",
            "[5,   355] train_loss: 1.810 train_accuracy: 0.418 test_accuracy: 0.398\n",
            "[5,   360] train_loss: 1.575 train_accuracy: 0.413 test_accuracy: 0.388\n",
            "[5,   365] train_loss: 1.737 train_accuracy: 0.408 test_accuracy: 0.382\n",
            "[5,   370] train_loss: 1.739 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[5,   375] train_loss: 1.822 train_accuracy: 0.411 test_accuracy: 0.389\n",
            "[5,   380] train_loss: 1.732 train_accuracy: 0.411 test_accuracy: 0.386\n",
            "[5,   385] train_loss: 1.792 train_accuracy: 0.410 test_accuracy: 0.391\n",
            "[5,   390] train_loss: 1.684 train_accuracy: 0.406 test_accuracy: 0.391\n",
            "[5,   395] train_loss: 1.769 train_accuracy: 0.395 test_accuracy: 0.383\n",
            "[5,   400] train_loss: 1.701 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[5,   405] train_loss: 1.673 train_accuracy: 0.404 test_accuracy: 0.381\n",
            "[5,   410] train_loss: 1.747 train_accuracy: 0.410 test_accuracy: 0.389\n",
            "[5,   415] train_loss: 1.632 train_accuracy: 0.415 test_accuracy: 0.398\n",
            "[5,   420] train_loss: 1.778 train_accuracy: 0.424 test_accuracy: 0.398\n",
            "[5,   425] train_loss: 1.789 train_accuracy: 0.419 test_accuracy: 0.393\n",
            "[5,   430] train_loss: 1.903 train_accuracy: 0.403 test_accuracy: 0.386\n",
            "[5,   435] train_loss: 1.791 train_accuracy: 0.398 test_accuracy: 0.383\n",
            "[5,   440] train_loss: 1.726 train_accuracy: 0.390 test_accuracy: 0.375\n",
            "[5,   445] train_loss: 1.702 train_accuracy: 0.391 test_accuracy: 0.374\n",
            "[5,   450] train_loss: 1.661 train_accuracy: 0.397 test_accuracy: 0.375\n",
            "[5,   455] train_loss: 1.818 train_accuracy: 0.407 test_accuracy: 0.387\n",
            "[5,   460] train_loss: 1.821 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[5,   465] train_loss: 1.626 train_accuracy: 0.409 test_accuracy: 0.391\n",
            "[5,   470] train_loss: 1.751 train_accuracy: 0.411 test_accuracy: 0.389\n",
            "[5,   475] train_loss: 1.745 train_accuracy: 0.403 test_accuracy: 0.389\n",
            "[5,   480] train_loss: 1.717 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[5,   485] train_loss: 1.690 train_accuracy: 0.387 test_accuracy: 0.372\n",
            "[5,   490] train_loss: 1.668 train_accuracy: 0.393 test_accuracy: 0.375\n",
            "[5,   495] train_loss: 1.836 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[5,   500] train_loss: 1.722 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[5,   505] train_loss: 1.630 train_accuracy: 0.390 test_accuracy: 0.372\n",
            "[5,   510] train_loss: 1.812 train_accuracy: 0.388 test_accuracy: 0.374\n",
            "[5,   515] train_loss: 1.708 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,   520] train_loss: 1.758 train_accuracy: 0.406 test_accuracy: 0.390\n",
            "[5,   525] train_loss: 1.759 train_accuracy: 0.411 test_accuracy: 0.382\n",
            "[5,   530] train_loss: 1.779 train_accuracy: 0.411 test_accuracy: 0.386\n",
            "[5,   535] train_loss: 1.856 train_accuracy: 0.398 test_accuracy: 0.377\n",
            "[5,   540] train_loss: 1.752 train_accuracy: 0.412 test_accuracy: 0.381\n",
            "[5,   545] train_loss: 1.794 train_accuracy: 0.406 test_accuracy: 0.379\n",
            "[5,   550] train_loss: 1.901 train_accuracy: 0.408 test_accuracy: 0.385\n",
            "[5,   555] train_loss: 1.767 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,   560] train_loss: 1.768 train_accuracy: 0.399 test_accuracy: 0.378\n",
            "[5,   565] train_loss: 1.706 train_accuracy: 0.398 test_accuracy: 0.378\n",
            "[5,   570] train_loss: 1.739 train_accuracy: 0.401 test_accuracy: 0.388\n",
            "[5,   575] train_loss: 1.771 train_accuracy: 0.406 test_accuracy: 0.384\n",
            "[5,   580] train_loss: 1.658 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   585] train_loss: 1.764 train_accuracy: 0.408 test_accuracy: 0.387\n",
            "[5,   590] train_loss: 1.701 train_accuracy: 0.407 test_accuracy: 0.382\n",
            "[5,   595] train_loss: 1.678 train_accuracy: 0.403 test_accuracy: 0.376\n",
            "[5,   600] train_loss: 1.834 train_accuracy: 0.399 test_accuracy: 0.375\n",
            "[5,   605] train_loss: 1.811 train_accuracy: 0.404 test_accuracy: 0.380\n",
            "[5,   610] train_loss: 1.823 train_accuracy: 0.406 test_accuracy: 0.383\n",
            "[5,   615] train_loss: 1.749 train_accuracy: 0.406 test_accuracy: 0.388\n",
            "[5,   620] train_loss: 1.785 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[5,   625] train_loss: 1.822 train_accuracy: 0.381 test_accuracy: 0.367\n",
            "[5,   630] train_loss: 1.652 train_accuracy: 0.394 test_accuracy: 0.374\n",
            "[5,   635] train_loss: 1.898 train_accuracy: 0.408 test_accuracy: 0.384\n",
            "[5,   640] train_loss: 1.722 train_accuracy: 0.400 test_accuracy: 0.380\n",
            "[5,   645] train_loss: 1.626 train_accuracy: 0.392 test_accuracy: 0.372\n",
            "[5,   650] train_loss: 1.784 train_accuracy: 0.392 test_accuracy: 0.373\n",
            "[5,   655] train_loss: 1.794 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[5,   660] train_loss: 1.709 train_accuracy: 0.400 test_accuracy: 0.377\n",
            "[5,   665] train_loss: 1.596 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[5,   670] train_loss: 1.801 train_accuracy: 0.382 test_accuracy: 0.355\n",
            "[5,   675] train_loss: 1.851 train_accuracy: 0.401 test_accuracy: 0.381\n",
            "[5,   680] train_loss: 1.700 train_accuracy: 0.385 test_accuracy: 0.374\n",
            "[5,   685] train_loss: 1.584 train_accuracy: 0.391 test_accuracy: 0.375\n",
            "[5,   690] train_loss: 1.934 train_accuracy: 0.386 test_accuracy: 0.372\n",
            "[5,   695] train_loss: 1.706 train_accuracy: 0.398 test_accuracy: 0.378\n",
            "[5,   700] train_loss: 1.806 train_accuracy: 0.413 test_accuracy: 0.391\n",
            "[5,   705] train_loss: 1.733 train_accuracy: 0.409 test_accuracy: 0.390\n",
            "[5,   710] train_loss: 1.721 train_accuracy: 0.408 test_accuracy: 0.389\n",
            "[5,   715] train_loss: 1.634 train_accuracy: 0.408 test_accuracy: 0.392\n",
            "[5,   720] train_loss: 1.819 train_accuracy: 0.399 test_accuracy: 0.383\n",
            "[5,   725] train_loss: 1.800 train_accuracy: 0.380 test_accuracy: 0.369\n",
            "[5,   730] train_loss: 1.717 train_accuracy: 0.392 test_accuracy: 0.375\n",
            "[5,   735] train_loss: 1.835 train_accuracy: 0.397 test_accuracy: 0.377\n",
            "[5,   740] train_loss: 1.731 train_accuracy: 0.394 test_accuracy: 0.379\n",
            "[5,   745] train_loss: 1.769 train_accuracy: 0.401 test_accuracy: 0.378\n",
            "[5,   750] train_loss: 1.852 train_accuracy: 0.404 test_accuracy: 0.377\n",
            "[5,   755] train_loss: 1.769 train_accuracy: 0.388 test_accuracy: 0.365\n",
            "[5,   760] train_loss: 1.761 train_accuracy: 0.385 test_accuracy: 0.365\n",
            "[5,   765] train_loss: 1.591 train_accuracy: 0.406 test_accuracy: 0.382\n",
            "[5,   770] train_loss: 1.722 train_accuracy: 0.406 test_accuracy: 0.387\n",
            "[5,   775] train_loss: 1.610 train_accuracy: 0.406 test_accuracy: 0.389\n",
            "[5,   780] train_loss: 1.781 train_accuracy: 0.410 test_accuracy: 0.388\n",
            "[5,   785] train_loss: 1.720 train_accuracy: 0.402 test_accuracy: 0.378\n",
            "[5,   790] train_loss: 1.752 train_accuracy: 0.396 test_accuracy: 0.378\n",
            "[5,   795] train_loss: 1.859 train_accuracy: 0.412 test_accuracy: 0.392\n",
            "[5,   800] train_loss: 1.678 train_accuracy: 0.388 test_accuracy: 0.377\n",
            "[5,   805] train_loss: 1.685 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[5,   810] train_loss: 1.651 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[5,   815] train_loss: 1.751 train_accuracy: 0.399 test_accuracy: 0.383\n",
            "[5,   820] train_loss: 1.746 train_accuracy: 0.398 test_accuracy: 0.382\n",
            "[5,   825] train_loss: 1.807 train_accuracy: 0.405 test_accuracy: 0.385\n",
            "[5,   830] train_loss: 1.583 train_accuracy: 0.401 test_accuracy: 0.386\n",
            "[5,   835] train_loss: 1.905 train_accuracy: 0.391 test_accuracy: 0.366\n",
            "[5,   840] train_loss: 1.872 train_accuracy: 0.400 test_accuracy: 0.378\n",
            "[5,   845] train_loss: 1.738 train_accuracy: 0.406 test_accuracy: 0.374\n",
            "[5,   850] train_loss: 1.690 train_accuracy: 0.405 test_accuracy: 0.376\n",
            "[5,   855] train_loss: 1.755 train_accuracy: 0.402 test_accuracy: 0.374\n",
            "[5,   860] train_loss: 1.770 train_accuracy: 0.398 test_accuracy: 0.376\n",
            "[5,   865] train_loss: 1.838 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   870] train_loss: 1.972 train_accuracy: 0.397 test_accuracy: 0.371\n",
            "[5,   875] train_loss: 1.744 train_accuracy: 0.397 test_accuracy: 0.373\n",
            "[5,   880] train_loss: 1.681 train_accuracy: 0.406 test_accuracy: 0.386\n",
            "[5,   885] train_loss: 1.838 train_accuracy: 0.405 test_accuracy: 0.387\n",
            "[5,   890] train_loss: 1.763 train_accuracy: 0.410 test_accuracy: 0.388\n",
            "[5,   895] train_loss: 1.650 train_accuracy: 0.400 test_accuracy: 0.381\n",
            "[5,   900] train_loss: 1.793 train_accuracy: 0.406 test_accuracy: 0.385\n",
            "[5,   905] train_loss: 1.768 train_accuracy: 0.409 test_accuracy: 0.388\n",
            "[5,   910] train_loss: 1.943 train_accuracy: 0.403 test_accuracy: 0.377\n",
            "[5,   915] train_loss: 1.742 train_accuracy: 0.402 test_accuracy: 0.379\n",
            "[5,   920] train_loss: 1.743 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   925] train_loss: 1.744 train_accuracy: 0.407 test_accuracy: 0.389\n",
            "[5,   930] train_loss: 1.738 train_accuracy: 0.410 test_accuracy: 0.387\n",
            "[5,   935] train_loss: 1.881 train_accuracy: 0.410 test_accuracy: 0.385\n",
            "[5,   940] train_loss: 1.807 train_accuracy: 0.404 test_accuracy: 0.379\n",
            "[5,   945] train_loss: 1.855 train_accuracy: 0.399 test_accuracy: 0.371\n",
            "[5,   950] train_loss: 1.782 train_accuracy: 0.413 test_accuracy: 0.387\n",
            "[5,   955] train_loss: 1.780 train_accuracy: 0.413 test_accuracy: 0.389\n",
            "[5,   960] train_loss: 1.806 train_accuracy: 0.410 test_accuracy: 0.391\n",
            "[5,   965] train_loss: 1.691 train_accuracy: 0.412 test_accuracy: 0.391\n",
            "[5,   970] train_loss: 1.830 train_accuracy: 0.420 test_accuracy: 0.395\n",
            "[5,   975] train_loss: 1.714 train_accuracy: 0.411 test_accuracy: 0.395\n",
            "[5,   980] train_loss: 1.586 train_accuracy: 0.403 test_accuracy: 0.382\n",
            "[5,   985] train_loss: 1.815 train_accuracy: 0.409 test_accuracy: 0.389\n",
            "[5,   990] train_loss: 1.678 train_accuracy: 0.413 test_accuracy: 0.387\n",
            "[5,   995] train_loss: 1.642 train_accuracy: 0.414 test_accuracy: 0.393\n",
            "[5,  1000] train_loss: 1.709 train_accuracy: 0.412 test_accuracy: 0.387\n",
            "[5,  1005] train_loss: 1.836 train_accuracy: 0.403 test_accuracy: 0.376\n",
            "[5,  1010] train_loss: 1.753 train_accuracy: 0.403 test_accuracy: 0.378\n",
            "[5,  1015] train_loss: 1.722 train_accuracy: 0.408 test_accuracy: 0.379\n",
            "[5,  1020] train_loss: 1.747 train_accuracy: 0.413 test_accuracy: 0.387\n",
            "[5,  1025] train_loss: 1.798 train_accuracy: 0.408 test_accuracy: 0.384\n",
            "[5,  1030] train_loss: 1.798 train_accuracy: 0.405 test_accuracy: 0.378\n",
            "[5,  1035] train_loss: 1.800 train_accuracy: 0.410 test_accuracy: 0.382\n",
            "[5,  1040] train_loss: 1.693 train_accuracy: 0.395 test_accuracy: 0.374\n",
            "[5,  1045] train_loss: 1.684 train_accuracy: 0.388 test_accuracy: 0.371\n",
            "[5,  1050] train_loss: 1.600 train_accuracy: 0.400 test_accuracy: 0.376\n",
            "[5,  1055] train_loss: 1.831 train_accuracy: 0.404 test_accuracy: 0.378\n",
            "[5,  1060] train_loss: 1.719 train_accuracy: 0.418 test_accuracy: 0.395\n",
            "[5,  1065] train_loss: 1.743 train_accuracy: 0.412 test_accuracy: 0.391\n",
            "[5,  1070] train_loss: 1.902 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[5,  1075] train_loss: 1.648 train_accuracy: 0.410 test_accuracy: 0.384\n",
            "[5,  1080] train_loss: 1.775 train_accuracy: 0.406 test_accuracy: 0.376\n",
            "[5,  1085] train_loss: 1.683 train_accuracy: 0.409 test_accuracy: 0.382\n",
            "[5,  1090] train_loss: 1.713 train_accuracy: 0.402 test_accuracy: 0.380\n",
            "[5,  1095] train_loss: 1.718 train_accuracy: 0.401 test_accuracy: 0.378\n",
            "[5,  1100] train_loss: 1.667 train_accuracy: 0.415 test_accuracy: 0.387\n",
            "[5,  1105] train_loss: 1.807 train_accuracy: 0.401 test_accuracy: 0.379\n",
            "[5,  1110] train_loss: 1.723 train_accuracy: 0.400 test_accuracy: 0.377\n",
            "[5,  1115] train_loss: 1.732 train_accuracy: 0.401 test_accuracy: 0.374\n",
            "[5,  1120] train_loss: 1.759 train_accuracy: 0.401 test_accuracy: 0.372\n",
            "[5,  1125] train_loss: 1.823 train_accuracy: 0.405 test_accuracy: 0.381\n",
            "[5,  1130] train_loss: 1.771 train_accuracy: 0.407 test_accuracy: 0.385\n",
            "[5,  1135] train_loss: 1.665 train_accuracy: 0.391 test_accuracy: 0.376\n",
            "[5,  1140] train_loss: 1.703 train_accuracy: 0.386 test_accuracy: 0.369\n",
            "[5,  1145] train_loss: 1.812 train_accuracy: 0.404 test_accuracy: 0.384\n",
            "[5,  1150] train_loss: 1.701 train_accuracy: 0.401 test_accuracy: 0.387\n",
            "[5,  1155] train_loss: 1.792 train_accuracy: 0.387 test_accuracy: 0.376\n",
            "[5,  1160] train_loss: 1.725 train_accuracy: 0.397 test_accuracy: 0.381\n",
            "[5,  1165] train_loss: 1.782 train_accuracy: 0.401 test_accuracy: 0.380\n",
            "[5,  1170] train_loss: 1.726 train_accuracy: 0.402 test_accuracy: 0.384\n",
            "[5,  1175] train_loss: 1.686 train_accuracy: 0.382 test_accuracy: 0.370\n",
            "[5,  1180] train_loss: 1.732 train_accuracy: 0.381 test_accuracy: 0.365\n",
            "[5,  1185] train_loss: 1.767 train_accuracy: 0.390 test_accuracy: 0.365\n",
            "[5,  1190] train_loss: 1.725 train_accuracy: 0.399 test_accuracy: 0.371\n",
            "[5,  1195] train_loss: 1.938 train_accuracy: 0.408 test_accuracy: 0.382\n",
            "[5,  1200] train_loss: 1.548 train_accuracy: 0.409 test_accuracy: 0.383\n",
            "[5,  1205] train_loss: 1.700 train_accuracy: 0.411 test_accuracy: 0.388\n",
            "[5,  1210] train_loss: 1.668 train_accuracy: 0.407 test_accuracy: 0.394\n",
            "[5,  1215] train_loss: 1.778 train_accuracy: 0.408 test_accuracy: 0.386\n",
            "[5,  1220] train_loss: 1.670 train_accuracy: 0.406 test_accuracy: 0.382\n",
            "[5,  1225] train_loss: 1.673 train_accuracy: 0.411 test_accuracy: 0.380\n",
            "[5,  1230] train_loss: 1.697 train_accuracy: 0.404 test_accuracy: 0.380\n",
            "[5,  1235] train_loss: 1.716 train_accuracy: 0.402 test_accuracy: 0.379\n",
            "[5,  1240] train_loss: 1.623 train_accuracy: 0.406 test_accuracy: 0.380\n",
            "[5,  1245] train_loss: 1.664 train_accuracy: 0.398 test_accuracy: 0.374\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "# Writing training accuracy to file\n",
        "with open('Accuracy_a_train.txt', 'w') as file:\n",
        "    for i in range(len(a_train)):\n",
        "        file.write(str(a_train[i]))\n",
        "        if i < len(a_train) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing test accuracy to file\n",
        "with open('Accuracy_a_test.txt', 'w') as file:\n",
        "    for i in range(len(a_test)):\n",
        "        file.write(str(a_test[i]))\n",
        "        if i < len(a_test) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing loss values to file\n",
        "with open('Accuracy_loss.txt', 'w') as file:\n",
        "    for i in range(len(lossaaa)):\n",
        "        file.write(str(lossaaa[i]))\n",
        "        if i < len(lossaaa) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "TltKDL6qZGN5"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Convert tensors to lists\n",
        "Inf_list = [tensor.item() for tensor in Inf]\n",
        "Var_av_list = [tensor.item() for tensor in Var_all]\n",
        "Generalization_Ratio_list = [tensor.item() for tensor in Generalization_Ratio_]\n",
        "\n",
        "# Writing Inf_list to file\n",
        "with open('Inf_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Inf_list)):\n",
        "        file.write(str(Inf_list[i]))\n",
        "        if i < len(Inf_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Var_av_list to file\n",
        "with open('Var_all_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Var_av_list)):\n",
        "        file.write(str(Var_av_list[i]))\n",
        "        if i < len(Var_av_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Generalization_Ratio_list to file\n",
        "with open('Generalization_Ratio_list.txt', 'w') as file:\n",
        "    for i in range(len(Generalization_Ratio_list)):\n",
        "        file.write(str(Generalization_Ratio_list[i]))\n",
        "        if i < len(Generalization_Ratio_list) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "D751KN1KmABL"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import time\n",
        "import os  # Import the os module\n",
        "\n",
        "os.makedirs(os.path.join('./Models/'), exist_ok=True)  # Create the directory './Models/' if it doesn't exist\n",
        "model_path = './Models/'  # Define the model path\n",
        "\n",
        "rq = time.strftime('%Y%m%d%H%M', time.localtime(time.time()))  # Get the current time in the format 'YYYYMMDDHHMM'\n",
        "\n",
        "# Save the training results\n",
        "current_model_path = model_path + rq + \"_model.pkl\"  # Create the full path for the model file with the current timestamp\n",
        "torch.save(net, current_model_path)  # Save the model to the specified path\n",
        "print(\"Saved model file: \" + current_model_path)  # Print the path of the saved model file"
      ],
      "metadata": {
        "id": "kjP2_kf0mFYH"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Display the highest value that appears during training\n",
        "print(\"train:\", max(a_train))  # Print the highest value in the training data\n",
        "print(\"test:\", max(a_test))  # Print the highest value in the test data\n",
        "print(\"loss:\", min(lossaaa))  # Print the minimum value of the loss"
      ],
      "metadata": {
        "id": "Np1rWV3JmJUn",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "78952464-4d7e-4b34-fc0e-8fac49182fc9"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "train: 0.4241\n",
            "test: 0.3979\n",
            "loss: 1.5480000495910644\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "set = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "testset = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 test dataset\n",
        "trainloader = torch.utils.data.DataLoader(trainset, batch_size=50000, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "t_loader = torch.utils.data.DataLoader(testset, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "trainloader_iter = iter(trainloader)  # Create an iterator for the training DataLoader\n",
        "tl_image, tl_label = next(trainloader_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "tl_image = tl_image.cuda()  # Move training images to GPU\n",
        "tl_label = tl_label.cuda()  # Move training labels to GPU\n",
        "tl_imageoutputs = net(tl_image)  # [batch, 10]  # Get the outputs from the network for the training images\n",
        "predict_y = torch.max(tl_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy = torch.eq(predict_y, tl_label).sum().item() / tl_label.size(0)  # Calculate accuracy for the training set\n",
        "print(\"train:\", float(accuracy))  # Print the training accuracy\n",
        "\n",
        "t_data_iter = iter(t_loader)  # Create an iterator for the test DataLoader\n",
        "t_image, t_label = next(t_data_iter)  # Get the next batch of images and labels from the test DataLoader\n",
        "t_image = t_image.cuda()  # Move test images to GPU\n",
        "t_label = t_label.cuda()  # Move test labels to GPU\n",
        "t_imageoutputs = net(t_image)  # [batch, 10]  # Get the outputs from the network for the test images\n",
        "predict = torch.max(t_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy_t = torch.eq(predict, t_label).sum().item() / t_label.size(0)  # Calculate accuracy for the test set\n",
        "print(\"test:\", float(accuracy_t))  # Print the test accuracy"
      ],
      "metadata": {
        "id": "VuEcsYQGmMqH",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "7948665c-a10e-4fa3-833b-ef787293c832"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "train: 0.39686\n",
            "test: 0.3743\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### **Network2 : use linear layers and active layers + Generalization Decision Process (GDP)**"
      ],
      "metadata": {
        "id": "2La70qLu1sLk"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import argparse\n",
        "import os\n",
        "import numpy as np\n",
        "import torchvision.transforms as transforms\n",
        "from torchvision.utils import save_image\n",
        "from torch.utils.data import DataLoader\n",
        "from torchvision import datasets\n",
        "from torch.autograd import Variable\n",
        "import torch.nn as nn\n",
        "import torch\n",
        "\n",
        "class LANet(nn.Module):\n",
        "    def __init__(self):  # Initialization function\n",
        "        super(LANet, self).__init__()\n",
        "\n",
        "        self.fc1 = nn.Linear(3*32*32, 1000)  # Define the first fully connected layer\n",
        "        self.fc2 = nn.Linear(1000, 500)  # Define the second fully connected layer\n",
        "        self.fc3 = nn.Linear(500, 100)  # Define the third fully connected layer\n",
        "        self.fc4 = nn.Linear(100, 50)  # Define the fourth fully connected layer\n",
        "        self.fc5 = nn.Linear(50, 25)  # Define the fifth fully connected layer\n",
        "        self.fc6 = nn.Linear(25, 20)  # Define the sixth fully connected layer\n",
        "        self.fc7 = nn.Linear(20, 10)  # Define the seventh fully connected layer\n",
        "\n",
        "    def forward(self, x):  # Define the forward pass\n",
        "\n",
        "        x = x.view(-1, 3*32*32)  # Flatten the input tensor\n",
        "        x = F.relu(self.fc1(x))  # Apply ReLU activation after the first layer\n",
        "        x = self.fc2(x)  # Apply the second layer\n",
        "        x = F.relu(self.fc3(x))  # Apply ReLU activation after the third layer\n",
        "        x = self.fc4(x)  # Apply the fourth layer\n",
        "        x = F.relu(self.fc5(x))  # Apply ReLU activation after the fifth layer\n",
        "        x = F.relu(self.fc6(x))  # Apply ReLU activation after the sixth layer\n",
        "        x = self.fc7(x)  # Apply the seventh layer\n",
        "        return x  # Return the output\n",
        "\n",
        "loss_function = torch.nn.CrossEntropyLoss()  # Define the loss function as CrossEntropyLoss\n",
        "net = LANet()  # Instantiate the LANet model\n",
        "# If a GPU is available, run in CUDA mode\n",
        "if torch.cuda.is_available():\n",
        "    net = net.cuda()  # Move the network to the GPU\n",
        "    loss_function = loss_function.cuda()  # Move the loss function to the GPU\n",
        "optimizer_L = torch.optim.Adam(net.parameters(), lr=0.001)  # Initialize the Adam optimizer with learning rate 0.001"
      ],
      "metadata": {
        "id": "X3e-a_Xf13Dh"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "from collections import Counter, defaultdict\n",
        "from itertools import combinations\n",
        "import random\n",
        "\n",
        "a_train = []  # To store training accuracy\n",
        "a_test = []  # To store test accuracy\n",
        "lossaaa = []  # To store loss values\n",
        "Inf = []  # To store information values\n",
        "Var_all = []  # To store all variation values\n",
        "Generalization_Ratio_ = []  # To store generalization ratios\n",
        "dicide_action = []  # To store decision actions\n",
        "loss_before = torch.tensor(30.0)  # Initial loss value\n",
        "los = torch.tensor(30.0)  # Initial loss value\n",
        "dis_before_A1 = torch.tensor(0)  # Distance before action A1\n",
        "dis_before_A2 = torch.tensor(0)  # Distance before action A2\n",
        "dis = torch.tensor(1)  # Distance increment\n",
        "per = \"N\"  # Previous iteration's action\n",
        "state_before = torch.tensor(0.0)  # Previous state value\n",
        "categrary_number = 10  # Number of categories\n",
        "tra_val_number = 2  # Training validation number\n",
        "\n",
        "for epoch in range(5):  # Loop over the dataset multiple times\n",
        "    e3412_iter = iter(e3412_loader)  # Iterator for e3412_loader\n",
        "    running_loss = 0.0  # Running loss\n",
        "    running_loss_all = 0.0  # Running loss for all\n",
        "    loss_before = Variable(loss_before, requires_grad=False)  # Make loss_before a variable\n",
        "    los = Variable(los, requires_grad=False)  # Make los a variable\n",
        "    state_before = Variable(state_before, requires_grad=False)  # Make state_before a variable\n",
        "    dis_before_A1 = Variable(dis_before_A1, requires_grad=False)  # Make dis_before_A1 a variable\n",
        "    dis_before_A2 = Variable(dis_before_A2, requires_grad=False)  # Make dis_before_A2 a variable\n",
        "    acc_A1 = Variable(dis_before_A1, requires_grad=False)  # Make acc_A1 a variable\n",
        "    acc_A2 = Variable(dis_before_A2, requires_grad=False)  # Make acc_A2 a variable\n",
        "    dis_ = Variable(dis, requires_grad=False)  # Make dis a variable\n",
        "\n",
        "    for step, (imgs, labels) in enumerate(e1234_loader):  # Iterate over the data\n",
        "        ### calculate losses\n",
        "        weight_val_probility = 1.0 / tra_val_number  # Weight for validation probability\n",
        "        labels = labels.cuda()  # Move labels to GPU\n",
        "        imgs = imgs.cuda()  # Move images to GPU\n",
        "        out_e1234 = net(imgs)  # Get output from the network\n",
        "        loss_out_e1234 = loss_function(out_e1234, labels)  # Calculate loss for e1234 (A1)\n",
        "\n",
        "        e3412_imgs, e3412_labels = next(e3412_iter)  # Get next batch from e3412_iter\n",
        "        e3412_imgs = e3412_imgs.cuda()  # Move e3412 images to GPU\n",
        "        e3412_labels = e3412_labels.cuda()  # Move e3412 labels to GPU\n",
        "        out_e3412 = net(e3412_imgs)  # Get output from the network\n",
        "        loss_out_e3412 = loss_function(out_e3412, e3412_labels)  # Calculate loss for e3412 (A3)\n",
        "\n",
        "        #################### extract\n",
        "        ## e1 ext count\n",
        "        e12_extracted_loader_image = e12_extracted_loader_image.cuda()  # Move e12 extracted images to GPU\n",
        "        e12_extracted_loader_label = e12_extracted_loader_label.cuda()  # Move e12 extracted labels to GPU\n",
        "        e12_extracted_out = net(e12_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e12_extracted = torch.max(e12_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ## e2 ext count\n",
        "        e34_extracted_loader_image = e34_extracted_loader_image.cuda()  # Move e34 extracted images to GPU\n",
        "        e34_extracted_loader_label = e34_extracted_loader_label.cuda()  # Move e34 extracted labels to GPU\n",
        "        e34_extracted_out = net(e34_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e34_extracted = torch.max(e34_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ########### e1 count\n",
        "        e12_s_loader_image = e12_s_loader_image.cuda()  # Move e12 sample images to GPU\n",
        "        e12_s_loader_label = e12_s_loader_label.cuda()  # Move e12 sample labels to GPU\n",
        "        e12_inform_out = net(e12_s_loader_image).detach()  # Get detached output from the network\n",
        "        e12_inform = torch.max(e12_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e12_inform = torch.chunk(e12_inform, 10)  # Split e12 inform into 10 chunks\n",
        "        split_e12_inform = list(split_e12_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e12_inform)):\n",
        "            counts_E12 = torch.bincount(split_e12_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e12 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e12[category] = counts_E12[category]  # Update counts\n",
        "            split_e12_inform[i] = counts_e12  # Store updated counts\n",
        "\n",
        "        ########### e2 count\n",
        "        e34_s_loader_image = e34_s_loader_image.cuda()  # Move e34 sample images to GPU\n",
        "        e34_s_loader_label = e34_s_loader_label.cuda()  # Move e34 sample labels to GPU\n",
        "        e34_inform_out = net(e34_s_loader_image).detach()  # Get detached output from the network\n",
        "        e34_inform = torch.max(e34_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e34_inform = torch.chunk(e34_inform, 10)  # Split e34 inform into 10 chunks\n",
        "        split_e34_inform = list(split_e34_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e34_inform)):\n",
        "            counts_E34 = torch.bincount(split_e34_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e34 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e34[category] = counts_E34[category]  # Update counts\n",
        "            split_e34_inform[i] = counts_e34  # Store updated counts\n",
        "\n",
        "        ##########\n",
        "        ## IN_IN_pro\n",
        "        counts_i_12 = torch.bincount(e12_inform, minlength=10)  # Count occurrences for e12 inform\n",
        "        counts_i_34 = torch.bincount(e34_inform, minlength=10)  # Count occurrences for e34 inform\n",
        "        counts_in_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_in_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_12[category] = counts_i_12[category]  # Update counts for e12\n",
        "        total_samples_in_12 = len(e12_inform)  # Total samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_34[category] = counts_i_34[category]  # Update counts for e34\n",
        "        total_samples_in_34 = len(e34_inform)  # Total samples in e34\n",
        "\n",
        "        min_denominator_in_12 = total_samples_in_12 * 1e-6  # Minimum denominator for e12\n",
        "        probabilities_in_12 = counts_in_12 / (total_samples_in_12 + min_denominator_in_12)  # Probabilities for e12\n",
        "        probabilities_tensor_in_12 = probabilities_in_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12\n",
        "\n",
        "        min_denominator_in_34 = total_samples_in_34 * 1e-6  # Minimum denominator for e34\n",
        "        probabilities_in_34 = counts_in_34 / (total_samples_in_34 + min_denominator_in_34)  # Probabilities for e34\n",
        "        probabilities_tensor_in_34 = probabilities_in_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34\n",
        "\n",
        "        counts_ext_12 = torch.bincount(e12_extracted, minlength=10)  # Count occurrences for e12 extracted\n",
        "        counts_ext_34 = torch.bincount(e34_extracted, minlength=10)  # Count occurrences for e34 extracted\n",
        "        counts_extra_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_extra_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_12[category] = counts_ext_12[category]  # Update counts for e12 extracted\n",
        "        total_extracted_in_12 = len(e12_extracted)  # Total extracted samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_34[category] = counts_ext_34[category]  # Update counts for e34 extracted\n",
        "        total_extracted_in_34 = len(e34_extracted)  # Total extracted samples in e34\n",
        "\n",
        "        min_denominator_ext_12 = total_extracted_in_12 * 1e-6  # Minimum denominator for e12 extracted\n",
        "        probabilities_ext_12 = counts_extra_12 / (total_extracted_in_12 + min_denominator_ext_12)  # Probabilities for e12 extracted\n",
        "        probabilities_tensor_extra_12 = probabilities_ext_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12 extracted\n",
        "\n",
        "        min_denominator_ext_34 = total_extracted_in_34 * 1e-6  # Minimum denominator for e34 extracted\n",
        "        probabilities_ext_34 = counts_extra_34 / (total_extracted_in_34 + min_denominator_ext_34)  # Probabilities for e34 extracted\n",
        "        probabilities_tensor_extra_34 = probabilities_ext_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34 extracted\n",
        "\n",
        "        ############################### Variation x ###################################\n",
        "        in_12_all = probabilities_tensor_in_12\n",
        "        in_34_all = probabilities_tensor_in_34\n",
        "        in_12_extra = probabilities_tensor_extra_12\n",
        "        in_34_extra = probabilities_tensor_extra_34\n",
        "        weight_tra_probility_all = 1.0 / 2\n",
        "        dow_all = \\\n",
        "              (in_12_all*weight_tra_probility_all + in_34_all*weight_tra_probility_all +\n",
        "              in_12_extra*weight_tra_probility_all + in_34_extra*weight_tra_probility_all + 1e-30)\n",
        "        in_1_all = (in_12_all*weight_tra_probility_all) / dow_all\n",
        "        in_2_all = (in_34_all*weight_tra_probility_all) / dow_all\n",
        "        e_1_all = (in_12_extra*weight_tra_probility_all) / dow_all\n",
        "        e_2_all = (in_34_extra*weight_tra_probility_all) / dow_all\n",
        "        in_1_all = in_1_all[0]\n",
        "        in_2_all = in_2_all[0]\n",
        "        e_1_all = e_1_all[0]\n",
        "        e_2_all = e_2_all[0]\n",
        "        d_KL_all = torch.zeros(10)\n",
        "        k_divergence_all = (in_1_all + 1e-30) * torch.log(in_1_all / (e_1_all + 1e-30) + 1e-30)\n",
        "        k_divergence_all_ = (in_1_all + 1e-30) * torch.log(in_1_all / (e_2_all + 1e-30) + 1e-30)\n",
        "        d_KL_all = torch.max(abs(k_divergence_all))\n",
        "        d_KL_all_ = torch.max(abs(k_divergence_all_))\n",
        "        Variation_all = torch.max(d_KL_all, d_KL_all_)\n",
        "        Var_all.append(Variation_all)\n",
        "\n",
        "        ############################ Information ###################################\n",
        "        all_combinations = list(combinations(range(10), 2))\n",
        "        K = categrary_number * (categrary_number - 1)\n",
        "        result_tensor = torch.zeros(len(all_combinations) * 2)  # Calculate the difference of each pair of combinations and store in result tensor\n",
        "        for c in range(10):\n",
        "            for idx, (i, j) in enumerate(all_combinations):\n",
        "                s1 = abs(((split_e12_inform[c][i]/10) + 1e-30) * torch.log((split_e12_inform[c][i]/10) / ((split_e12_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                s3 = abs(((split_e34_inform[c][i]/10) + 1e-30) * torch.log((split_e34_inform[c][i]/10) / ((split_e34_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                min_value = torch.min(s1, s3)\n",
        "                result_tensor[idx] = min_value.item()\n",
        "                idx_ = idx + len(all_combinations)\n",
        "                s1_ = abs(((split_e12_inform[c][j]/10) + 1e-30) * torch.log((split_e12_inform[c][j]/10) / ((split_e12_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                s3_ = abs(((split_e34_inform[c][j]/10) + 1e-30) * torch.log((split_e34_inform[c][j]/10) / ((split_e34_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                min_value_ = torch.min(s1_, s3_)\n",
        "                result_tensor[idx_] = min_value_.item()\n",
        "        Information = torch.sum(result_tensor) / K\n",
        "        Inf.append(Information)\n",
        "\n",
        "        ############################ Generalization_Ratio ###################################\n",
        "        Generalization_Ratio = Variation_all * (Information + 1.0) / Information\n",
        "        Generalization_Ratio_.append(Generalization_Ratio)\n",
        "\n",
        "        ############################ Generalization Decision Process (GDP) ###################################\n",
        "        state_now = Generalization_Ratio\n",
        "        loss_before = loss_before.cuda()\n",
        "        state_before = state_before.cuda()\n",
        "        state_dis = state_now - state_before\n",
        "        result_tensor = torch.cat((loss_out_e1234.unsqueeze(0), loss_out_e3412.unsqueeze(0)), 0)\n",
        "\n",
        "        # Because two datasets loss_out_e1234 and loss_out_e3412 are used, and there are actions A1 and A2,\n",
        "        # choose one based on the reward\n",
        "        if state_dis >= 0.0:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "        else:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "\n",
        "        ####################################\n",
        "        #### optimizer\n",
        "        los = loss - loss_before\n",
        "        state_before = state_now\n",
        "        optimizer_L.zero_grad()\n",
        "        loss.backward()\n",
        "        optimizer_L.step()\n",
        "        loss_before = loss\n",
        "        running_loss += loss.item()\n",
        "\n",
        "        # Print statistics\n",
        "        if step % 5 == 4:  # Print every 500 mini-batches\n",
        "            with torch.no_grad():  # 'with' is a context manager\n",
        "                s_test_image = s_test_image.cuda()\n",
        "                s_test_label = s_test_label.cuda()\n",
        "                s_tra_image = s_tra_image.cuda()\n",
        "                s_tra_label = s_tra_label.cuda()\n",
        "                outputs = net(s_test_image)  # [batch, 10]\n",
        "                predict_y = torch.max(outputs, dim=1)[1]\n",
        "                accuracy = torch.eq(predict_y, s_test_label).sum().item() / s_test_label.size(0)\n",
        "                a_test.append(float(accuracy))\n",
        "                outputs_t = net(s_tra_image)  # [batch, 10]\n",
        "                predict_y_t = torch.max(outputs_t, dim=1)[1]\n",
        "                accuracy_t = torch.eq(predict_y_t, s_tra_label).sum().item() / s_tra_label.size(0)\n",
        "                a_train.append(float(accuracy_t))\n",
        "                lossaaa.append(float(running_loss / 5))\n",
        "                print('[%d, %5d] train_loss: %.3f train_accuracy: %.3f test_accuracy: %.3f' %\n",
        "                      (epoch + 1, step + 1, running_loss / 5, accuracy_t, accuracy))\n",
        "                running_loss = 0.0\n",
        "                running_loss = 0.0"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "96P5N_Tm2Riu",
        "outputId": "3f60cd8f-5e70-4402-baf1-a88256c757e4"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "[1,     5] train_loss: 0.967 train_accuracy: 0.647 test_accuracy: 0.520\n",
            "[1,    10] train_loss: 1.000 train_accuracy: 0.653 test_accuracy: 0.525\n",
            "[1,    15] train_loss: 1.020 train_accuracy: 0.663 test_accuracy: 0.531\n",
            "[1,    20] train_loss: 0.939 train_accuracy: 0.663 test_accuracy: 0.528\n",
            "[1,    25] train_loss: 0.924 train_accuracy: 0.654 test_accuracy: 0.530\n",
            "[1,    30] train_loss: 0.971 train_accuracy: 0.663 test_accuracy: 0.530\n",
            "[1,    35] train_loss: 1.068 train_accuracy: 0.652 test_accuracy: 0.521\n",
            "[1,    40] train_loss: 0.986 train_accuracy: 0.667 test_accuracy: 0.533\n",
            "[1,    45] train_loss: 1.076 train_accuracy: 0.664 test_accuracy: 0.529\n",
            "[1,    50] train_loss: 1.072 train_accuracy: 0.665 test_accuracy: 0.528\n",
            "[1,    55] train_loss: 0.951 train_accuracy: 0.665 test_accuracy: 0.524\n",
            "[1,    60] train_loss: 0.941 train_accuracy: 0.655 test_accuracy: 0.519\n",
            "[1,    65] train_loss: 0.912 train_accuracy: 0.657 test_accuracy: 0.522\n",
            "[1,    70] train_loss: 1.081 train_accuracy: 0.654 test_accuracy: 0.521\n",
            "[1,    75] train_loss: 1.030 train_accuracy: 0.659 test_accuracy: 0.521\n",
            "[1,    80] train_loss: 1.091 train_accuracy: 0.664 test_accuracy: 0.518\n",
            "[1,    85] train_loss: 1.125 train_accuracy: 0.661 test_accuracy: 0.520\n",
            "[1,    90] train_loss: 1.098 train_accuracy: 0.659 test_accuracy: 0.524\n",
            "[1,    95] train_loss: 0.899 train_accuracy: 0.661 test_accuracy: 0.528\n",
            "[1,   100] train_loss: 0.984 train_accuracy: 0.660 test_accuracy: 0.522\n",
            "[1,   105] train_loss: 1.023 train_accuracy: 0.666 test_accuracy: 0.526\n",
            "[1,   110] train_loss: 0.918 train_accuracy: 0.656 test_accuracy: 0.520\n",
            "[1,   115] train_loss: 1.022 train_accuracy: 0.649 test_accuracy: 0.523\n",
            "[1,   120] train_loss: 0.984 train_accuracy: 0.659 test_accuracy: 0.527\n",
            "[1,   125] train_loss: 0.962 train_accuracy: 0.664 test_accuracy: 0.528\n",
            "[1,   130] train_loss: 0.994 train_accuracy: 0.652 test_accuracy: 0.518\n",
            "[1,   135] train_loss: 1.014 train_accuracy: 0.664 test_accuracy: 0.521\n",
            "[1,   140] train_loss: 0.829 train_accuracy: 0.663 test_accuracy: 0.524\n",
            "[1,   145] train_loss: 0.944 train_accuracy: 0.665 test_accuracy: 0.525\n",
            "[1,   150] train_loss: 1.063 train_accuracy: 0.673 test_accuracy: 0.531\n",
            "[1,   155] train_loss: 0.971 train_accuracy: 0.650 test_accuracy: 0.522\n",
            "[1,   160] train_loss: 1.047 train_accuracy: 0.650 test_accuracy: 0.526\n",
            "[1,   165] train_loss: 1.091 train_accuracy: 0.657 test_accuracy: 0.526\n",
            "[1,   170] train_loss: 1.072 train_accuracy: 0.659 test_accuracy: 0.521\n",
            "[1,   175] train_loss: 0.907 train_accuracy: 0.664 test_accuracy: 0.527\n",
            "[1,   180] train_loss: 1.052 train_accuracy: 0.665 test_accuracy: 0.533\n",
            "[1,   185] train_loss: 0.920 train_accuracy: 0.672 test_accuracy: 0.537\n",
            "[1,   190] train_loss: 0.803 train_accuracy: 0.664 test_accuracy: 0.536\n",
            "[1,   195] train_loss: 1.105 train_accuracy: 0.664 test_accuracy: 0.534\n",
            "[1,   200] train_loss: 1.066 train_accuracy: 0.673 test_accuracy: 0.537\n",
            "[1,   205] train_loss: 0.894 train_accuracy: 0.664 test_accuracy: 0.532\n",
            "[1,   210] train_loss: 0.994 train_accuracy: 0.656 test_accuracy: 0.528\n",
            "[1,   215] train_loss: 0.940 train_accuracy: 0.657 test_accuracy: 0.525\n",
            "[1,   220] train_loss: 0.927 train_accuracy: 0.656 test_accuracy: 0.525\n",
            "[1,   225] train_loss: 0.924 train_accuracy: 0.657 test_accuracy: 0.527\n",
            "[1,   230] train_loss: 0.827 train_accuracy: 0.663 test_accuracy: 0.526\n",
            "[1,   235] train_loss: 0.954 train_accuracy: 0.665 test_accuracy: 0.529\n",
            "[1,   240] train_loss: 0.908 train_accuracy: 0.672 test_accuracy: 0.535\n",
            "[1,   245] train_loss: 1.007 train_accuracy: 0.667 test_accuracy: 0.525\n",
            "[1,   250] train_loss: 0.958 train_accuracy: 0.653 test_accuracy: 0.518\n",
            "[1,   255] train_loss: 0.951 train_accuracy: 0.657 test_accuracy: 0.518\n",
            "[1,   260] train_loss: 0.971 train_accuracy: 0.658 test_accuracy: 0.518\n",
            "[1,   265] train_loss: 1.145 train_accuracy: 0.660 test_accuracy: 0.529\n",
            "[1,   270] train_loss: 1.016 train_accuracy: 0.650 test_accuracy: 0.524\n",
            "[1,   275] train_loss: 0.926 train_accuracy: 0.651 test_accuracy: 0.522\n",
            "[1,   280] train_loss: 1.114 train_accuracy: 0.665 test_accuracy: 0.527\n",
            "[1,   285] train_loss: 0.852 train_accuracy: 0.666 test_accuracy: 0.527\n",
            "[1,   290] train_loss: 1.014 train_accuracy: 0.673 test_accuracy: 0.532\n",
            "[1,   295] train_loss: 1.051 train_accuracy: 0.669 test_accuracy: 0.532\n",
            "[1,   300] train_loss: 1.101 train_accuracy: 0.670 test_accuracy: 0.532\n",
            "[1,   305] train_loss: 1.029 train_accuracy: 0.671 test_accuracy: 0.533\n",
            "[1,   310] train_loss: 0.929 train_accuracy: 0.674 test_accuracy: 0.536\n",
            "[1,   315] train_loss: 0.958 train_accuracy: 0.667 test_accuracy: 0.537\n",
            "[1,   320] train_loss: 1.006 train_accuracy: 0.669 test_accuracy: 0.533\n",
            "[1,   325] train_loss: 0.840 train_accuracy: 0.671 test_accuracy: 0.533\n",
            "[1,   330] train_loss: 0.882 train_accuracy: 0.678 test_accuracy: 0.537\n",
            "[1,   335] train_loss: 0.932 train_accuracy: 0.668 test_accuracy: 0.528\n",
            "[1,   340] train_loss: 0.920 train_accuracy: 0.668 test_accuracy: 0.532\n",
            "[1,   345] train_loss: 0.906 train_accuracy: 0.669 test_accuracy: 0.530\n",
            "[1,   350] train_loss: 0.988 train_accuracy: 0.661 test_accuracy: 0.523\n",
            "[1,   355] train_loss: 1.007 train_accuracy: 0.653 test_accuracy: 0.516\n",
            "[1,   360] train_loss: 0.962 train_accuracy: 0.658 test_accuracy: 0.525\n",
            "[1,   365] train_loss: 0.928 train_accuracy: 0.665 test_accuracy: 0.528\n",
            "[1,   370] train_loss: 0.951 train_accuracy: 0.663 test_accuracy: 0.525\n",
            "[1,   375] train_loss: 0.948 train_accuracy: 0.657 test_accuracy: 0.525\n",
            "[1,   380] train_loss: 1.055 train_accuracy: 0.655 test_accuracy: 0.524\n",
            "[1,   385] train_loss: 0.933 train_accuracy: 0.661 test_accuracy: 0.524\n",
            "[1,   390] train_loss: 0.929 train_accuracy: 0.672 test_accuracy: 0.523\n",
            "[1,   395] train_loss: 1.017 train_accuracy: 0.664 test_accuracy: 0.526\n",
            "[1,   400] train_loss: 1.022 train_accuracy: 0.658 test_accuracy: 0.529\n",
            "[1,   405] train_loss: 0.995 train_accuracy: 0.654 test_accuracy: 0.521\n",
            "[1,   410] train_loss: 0.922 train_accuracy: 0.641 test_accuracy: 0.512\n",
            "[1,   415] train_loss: 0.932 train_accuracy: 0.646 test_accuracy: 0.524\n",
            "[1,   420] train_loss: 1.197 train_accuracy: 0.645 test_accuracy: 0.518\n",
            "[1,   425] train_loss: 1.106 train_accuracy: 0.623 test_accuracy: 0.492\n",
            "[1,   430] train_loss: 1.067 train_accuracy: 0.636 test_accuracy: 0.499\n",
            "[1,   435] train_loss: 1.130 train_accuracy: 0.660 test_accuracy: 0.520\n",
            "[1,   440] train_loss: 0.900 train_accuracy: 0.649 test_accuracy: 0.518\n",
            "[1,   445] train_loss: 0.992 train_accuracy: 0.652 test_accuracy: 0.526\n",
            "[1,   450] train_loss: 0.983 train_accuracy: 0.660 test_accuracy: 0.527\n",
            "[1,   455] train_loss: 1.060 train_accuracy: 0.647 test_accuracy: 0.523\n",
            "[1,   460] train_loss: 1.036 train_accuracy: 0.649 test_accuracy: 0.527\n",
            "[1,   465] train_loss: 0.982 train_accuracy: 0.648 test_accuracy: 0.518\n",
            "[1,   470] train_loss: 0.911 train_accuracy: 0.662 test_accuracy: 0.523\n",
            "[1,   475] train_loss: 0.934 train_accuracy: 0.661 test_accuracy: 0.528\n",
            "[1,   480] train_loss: 0.980 train_accuracy: 0.650 test_accuracy: 0.517\n",
            "[1,   485] train_loss: 0.954 train_accuracy: 0.652 test_accuracy: 0.519\n",
            "[1,   490] train_loss: 0.913 train_accuracy: 0.663 test_accuracy: 0.526\n",
            "[1,   495] train_loss: 0.991 train_accuracy: 0.662 test_accuracy: 0.526\n",
            "[1,   500] train_loss: 1.200 train_accuracy: 0.658 test_accuracy: 0.522\n",
            "[1,   505] train_loss: 1.106 train_accuracy: 0.651 test_accuracy: 0.519\n",
            "[1,   510] train_loss: 1.047 train_accuracy: 0.648 test_accuracy: 0.518\n",
            "[1,   515] train_loss: 1.114 train_accuracy: 0.659 test_accuracy: 0.529\n",
            "[1,   520] train_loss: 0.935 train_accuracy: 0.667 test_accuracy: 0.534\n",
            "[1,   525] train_loss: 1.163 train_accuracy: 0.672 test_accuracy: 0.533\n",
            "[1,   530] train_loss: 1.111 train_accuracy: 0.675 test_accuracy: 0.535\n",
            "[1,   535] train_loss: 0.910 train_accuracy: 0.661 test_accuracy: 0.527\n",
            "[1,   540] train_loss: 1.097 train_accuracy: 0.664 test_accuracy: 0.529\n",
            "[1,   545] train_loss: 1.041 train_accuracy: 0.671 test_accuracy: 0.538\n",
            "[1,   550] train_loss: 1.040 train_accuracy: 0.669 test_accuracy: 0.535\n",
            "[1,   555] train_loss: 1.156 train_accuracy: 0.663 test_accuracy: 0.529\n",
            "[1,   560] train_loss: 0.937 train_accuracy: 0.667 test_accuracy: 0.531\n",
            "[1,   565] train_loss: 1.000 train_accuracy: 0.678 test_accuracy: 0.534\n",
            "[1,   570] train_loss: 1.024 train_accuracy: 0.676 test_accuracy: 0.529\n",
            "[1,   575] train_loss: 0.872 train_accuracy: 0.675 test_accuracy: 0.538\n",
            "[1,   580] train_loss: 0.957 train_accuracy: 0.671 test_accuracy: 0.535\n",
            "[1,   585] train_loss: 1.003 train_accuracy: 0.672 test_accuracy: 0.534\n",
            "[1,   590] train_loss: 1.006 train_accuracy: 0.660 test_accuracy: 0.523\n",
            "[1,   595] train_loss: 0.883 train_accuracy: 0.654 test_accuracy: 0.515\n",
            "[1,   600] train_loss: 0.967 train_accuracy: 0.665 test_accuracy: 0.519\n",
            "[1,   605] train_loss: 0.884 train_accuracy: 0.669 test_accuracy: 0.523\n",
            "[1,   610] train_loss: 0.928 train_accuracy: 0.670 test_accuracy: 0.537\n",
            "[1,   615] train_loss: 1.061 train_accuracy: 0.667 test_accuracy: 0.534\n",
            "[1,   620] train_loss: 0.868 train_accuracy: 0.670 test_accuracy: 0.527\n",
            "[1,   625] train_loss: 0.866 train_accuracy: 0.658 test_accuracy: 0.516\n",
            "[1,   630] train_loss: 1.117 train_accuracy: 0.655 test_accuracy: 0.523\n",
            "[1,   635] train_loss: 1.231 train_accuracy: 0.655 test_accuracy: 0.520\n",
            "[1,   640] train_loss: 1.013 train_accuracy: 0.658 test_accuracy: 0.523\n",
            "[1,   645] train_loss: 0.983 train_accuracy: 0.660 test_accuracy: 0.522\n",
            "[1,   650] train_loss: 1.130 train_accuracy: 0.653 test_accuracy: 0.520\n",
            "[1,   655] train_loss: 1.008 train_accuracy: 0.663 test_accuracy: 0.524\n",
            "[1,   660] train_loss: 0.967 train_accuracy: 0.668 test_accuracy: 0.523\n",
            "[1,   665] train_loss: 0.931 train_accuracy: 0.668 test_accuracy: 0.522\n",
            "[1,   670] train_loss: 1.049 train_accuracy: 0.677 test_accuracy: 0.527\n",
            "[1,   675] train_loss: 1.072 train_accuracy: 0.676 test_accuracy: 0.532\n",
            "[1,   680] train_loss: 0.961 train_accuracy: 0.650 test_accuracy: 0.516\n",
            "[1,   685] train_loss: 1.112 train_accuracy: 0.662 test_accuracy: 0.521\n",
            "[1,   690] train_loss: 0.951 train_accuracy: 0.658 test_accuracy: 0.513\n",
            "[1,   695] train_loss: 0.985 train_accuracy: 0.651 test_accuracy: 0.510\n",
            "[1,   700] train_loss: 1.012 train_accuracy: 0.664 test_accuracy: 0.520\n",
            "[1,   705] train_loss: 1.082 train_accuracy: 0.658 test_accuracy: 0.520\n",
            "[1,   710] train_loss: 1.015 train_accuracy: 0.653 test_accuracy: 0.517\n",
            "[1,   715] train_loss: 0.984 train_accuracy: 0.660 test_accuracy: 0.523\n",
            "[1,   720] train_loss: 0.984 train_accuracy: 0.651 test_accuracy: 0.518\n",
            "[1,   725] train_loss: 1.131 train_accuracy: 0.657 test_accuracy: 0.524\n",
            "[1,   730] train_loss: 1.016 train_accuracy: 0.657 test_accuracy: 0.523\n",
            "[1,   735] train_loss: 0.921 train_accuracy: 0.657 test_accuracy: 0.525\n",
            "[1,   740] train_loss: 1.085 train_accuracy: 0.671 test_accuracy: 0.530\n",
            "[1,   745] train_loss: 1.086 train_accuracy: 0.669 test_accuracy: 0.525\n",
            "[1,   750] train_loss: 1.083 train_accuracy: 0.669 test_accuracy: 0.525\n",
            "[1,   755] train_loss: 0.987 train_accuracy: 0.672 test_accuracy: 0.526\n",
            "[1,   760] train_loss: 0.965 train_accuracy: 0.663 test_accuracy: 0.521\n",
            "[1,   765] train_loss: 0.882 train_accuracy: 0.662 test_accuracy: 0.527\n",
            "[1,   770] train_loss: 1.114 train_accuracy: 0.667 test_accuracy: 0.525\n",
            "[1,   775] train_loss: 1.136 train_accuracy: 0.668 test_accuracy: 0.523\n",
            "[1,   780] train_loss: 1.094 train_accuracy: 0.675 test_accuracy: 0.525\n",
            "[1,   785] train_loss: 0.914 train_accuracy: 0.674 test_accuracy: 0.531\n",
            "[1,   790] train_loss: 1.074 train_accuracy: 0.673 test_accuracy: 0.531\n",
            "[1,   795] train_loss: 0.998 train_accuracy: 0.665 test_accuracy: 0.532\n",
            "[1,   800] train_loss: 0.989 train_accuracy: 0.663 test_accuracy: 0.530\n",
            "[1,   805] train_loss: 0.956 train_accuracy: 0.670 test_accuracy: 0.529\n",
            "[1,   810] train_loss: 0.910 train_accuracy: 0.668 test_accuracy: 0.526\n",
            "[1,   815] train_loss: 1.032 train_accuracy: 0.672 test_accuracy: 0.527\n",
            "[1,   820] train_loss: 1.050 train_accuracy: 0.661 test_accuracy: 0.522\n",
            "[1,   825] train_loss: 1.124 train_accuracy: 0.657 test_accuracy: 0.521\n",
            "[1,   830] train_loss: 0.994 train_accuracy: 0.656 test_accuracy: 0.522\n",
            "[1,   835] train_loss: 1.069 train_accuracy: 0.667 test_accuracy: 0.530\n",
            "[1,   840] train_loss: 0.902 train_accuracy: 0.668 test_accuracy: 0.533\n",
            "[1,   845] train_loss: 0.973 train_accuracy: 0.675 test_accuracy: 0.530\n",
            "[1,   850] train_loss: 0.901 train_accuracy: 0.674 test_accuracy: 0.534\n",
            "[1,   855] train_loss: 1.119 train_accuracy: 0.671 test_accuracy: 0.535\n",
            "[1,   860] train_loss: 1.256 train_accuracy: 0.669 test_accuracy: 0.538\n",
            "[1,   865] train_loss: 0.982 train_accuracy: 0.675 test_accuracy: 0.531\n",
            "[1,   870] train_loss: 1.146 train_accuracy: 0.673 test_accuracy: 0.524\n",
            "[1,   875] train_loss: 0.947 train_accuracy: 0.665 test_accuracy: 0.516\n",
            "[1,   880] train_loss: 1.146 train_accuracy: 0.675 test_accuracy: 0.524\n",
            "[1,   885] train_loss: 0.928 train_accuracy: 0.676 test_accuracy: 0.536\n",
            "[1,   890] train_loss: 1.088 train_accuracy: 0.671 test_accuracy: 0.532\n",
            "[1,   895] train_loss: 1.077 train_accuracy: 0.672 test_accuracy: 0.523\n",
            "[1,   900] train_loss: 0.991 train_accuracy: 0.670 test_accuracy: 0.523\n",
            "[1,   905] train_loss: 1.012 train_accuracy: 0.674 test_accuracy: 0.527\n",
            "[1,   910] train_loss: 0.949 train_accuracy: 0.672 test_accuracy: 0.535\n",
            "[1,   915] train_loss: 1.046 train_accuracy: 0.676 test_accuracy: 0.534\n",
            "[1,   920] train_loss: 1.089 train_accuracy: 0.675 test_accuracy: 0.528\n",
            "[1,   925] train_loss: 0.919 train_accuracy: 0.674 test_accuracy: 0.527\n",
            "[1,   930] train_loss: 0.794 train_accuracy: 0.669 test_accuracy: 0.529\n",
            "[1,   935] train_loss: 1.247 train_accuracy: 0.664 test_accuracy: 0.518\n",
            "[1,   940] train_loss: 1.062 train_accuracy: 0.667 test_accuracy: 0.519\n",
            "[1,   945] train_loss: 0.979 train_accuracy: 0.670 test_accuracy: 0.523\n",
            "[1,   950] train_loss: 0.999 train_accuracy: 0.674 test_accuracy: 0.521\n",
            "[1,   955] train_loss: 1.131 train_accuracy: 0.674 test_accuracy: 0.525\n",
            "[1,   960] train_loss: 1.008 train_accuracy: 0.671 test_accuracy: 0.525\n",
            "[1,   965] train_loss: 1.029 train_accuracy: 0.672 test_accuracy: 0.525\n",
            "[1,   970] train_loss: 1.044 train_accuracy: 0.674 test_accuracy: 0.523\n",
            "[1,   975] train_loss: 0.960 train_accuracy: 0.661 test_accuracy: 0.519\n",
            "[1,   980] train_loss: 1.004 train_accuracy: 0.665 test_accuracy: 0.521\n",
            "[1,   985] train_loss: 1.063 train_accuracy: 0.667 test_accuracy: 0.530\n",
            "[1,   990] train_loss: 0.871 train_accuracy: 0.672 test_accuracy: 0.530\n",
            "[1,   995] train_loss: 1.024 train_accuracy: 0.666 test_accuracy: 0.521\n",
            "[1,  1000] train_loss: 0.999 train_accuracy: 0.677 test_accuracy: 0.529\n",
            "[1,  1005] train_loss: 1.006 train_accuracy: 0.683 test_accuracy: 0.535\n",
            "[1,  1010] train_loss: 1.129 train_accuracy: 0.675 test_accuracy: 0.528\n",
            "[1,  1015] train_loss: 1.059 train_accuracy: 0.680 test_accuracy: 0.534\n",
            "[1,  1020] train_loss: 0.881 train_accuracy: 0.680 test_accuracy: 0.529\n",
            "[1,  1025] train_loss: 1.009 train_accuracy: 0.672 test_accuracy: 0.527\n",
            "[1,  1030] train_loss: 1.031 train_accuracy: 0.677 test_accuracy: 0.525\n",
            "[1,  1035] train_loss: 0.951 train_accuracy: 0.662 test_accuracy: 0.519\n",
            "[1,  1040] train_loss: 0.980 train_accuracy: 0.655 test_accuracy: 0.517\n",
            "[1,  1045] train_loss: 1.113 train_accuracy: 0.667 test_accuracy: 0.523\n",
            "[1,  1050] train_loss: 1.020 train_accuracy: 0.671 test_accuracy: 0.520\n",
            "[1,  1055] train_loss: 1.013 train_accuracy: 0.671 test_accuracy: 0.529\n",
            "[1,  1060] train_loss: 0.927 train_accuracy: 0.665 test_accuracy: 0.526\n",
            "[1,  1065] train_loss: 0.982 train_accuracy: 0.665 test_accuracy: 0.529\n",
            "[1,  1070] train_loss: 1.060 train_accuracy: 0.674 test_accuracy: 0.531\n",
            "[1,  1075] train_loss: 0.977 train_accuracy: 0.669 test_accuracy: 0.532\n",
            "[1,  1080] train_loss: 1.131 train_accuracy: 0.665 test_accuracy: 0.530\n",
            "[1,  1085] train_loss: 1.071 train_accuracy: 0.675 test_accuracy: 0.536\n",
            "[1,  1090] train_loss: 1.054 train_accuracy: 0.668 test_accuracy: 0.524\n",
            "[1,  1095] train_loss: 0.985 train_accuracy: 0.660 test_accuracy: 0.518\n",
            "[1,  1100] train_loss: 1.104 train_accuracy: 0.678 test_accuracy: 0.535\n",
            "[1,  1105] train_loss: 1.050 train_accuracy: 0.681 test_accuracy: 0.537\n",
            "[1,  1110] train_loss: 1.091 train_accuracy: 0.681 test_accuracy: 0.537\n",
            "[1,  1115] train_loss: 0.866 train_accuracy: 0.673 test_accuracy: 0.533\n",
            "[1,  1120] train_loss: 0.984 train_accuracy: 0.676 test_accuracy: 0.533\n",
            "[1,  1125] train_loss: 0.986 train_accuracy: 0.672 test_accuracy: 0.526\n",
            "[1,  1130] train_loss: 1.028 train_accuracy: 0.671 test_accuracy: 0.529\n",
            "[1,  1135] train_loss: 1.003 train_accuracy: 0.667 test_accuracy: 0.525\n",
            "[1,  1140] train_loss: 1.005 train_accuracy: 0.664 test_accuracy: 0.520\n",
            "[1,  1145] train_loss: 0.961 train_accuracy: 0.668 test_accuracy: 0.521\n",
            "[1,  1150] train_loss: 0.974 train_accuracy: 0.666 test_accuracy: 0.526\n",
            "[1,  1155] train_loss: 1.118 train_accuracy: 0.662 test_accuracy: 0.519\n",
            "[1,  1160] train_loss: 0.916 train_accuracy: 0.662 test_accuracy: 0.514\n",
            "[1,  1165] train_loss: 0.868 train_accuracy: 0.676 test_accuracy: 0.525\n",
            "[1,  1170] train_loss: 0.986 train_accuracy: 0.679 test_accuracy: 0.531\n",
            "[1,  1175] train_loss: 1.162 train_accuracy: 0.680 test_accuracy: 0.530\n",
            "[1,  1180] train_loss: 1.070 train_accuracy: 0.677 test_accuracy: 0.525\n",
            "[1,  1185] train_loss: 1.089 train_accuracy: 0.648 test_accuracy: 0.505\n",
            "[1,  1190] train_loss: 1.218 train_accuracy: 0.645 test_accuracy: 0.495\n",
            "[1,  1195] train_loss: 1.050 train_accuracy: 0.654 test_accuracy: 0.508\n",
            "[1,  1200] train_loss: 0.999 train_accuracy: 0.655 test_accuracy: 0.514\n",
            "[1,  1205] train_loss: 1.069 train_accuracy: 0.668 test_accuracy: 0.530\n",
            "[1,  1210] train_loss: 1.061 train_accuracy: 0.669 test_accuracy: 0.527\n",
            "[1,  1215] train_loss: 0.961 train_accuracy: 0.673 test_accuracy: 0.531\n",
            "[1,  1220] train_loss: 0.983 train_accuracy: 0.673 test_accuracy: 0.535\n",
            "[1,  1225] train_loss: 0.817 train_accuracy: 0.664 test_accuracy: 0.531\n",
            "[1,  1230] train_loss: 1.064 train_accuracy: 0.667 test_accuracy: 0.534\n",
            "[1,  1235] train_loss: 1.000 train_accuracy: 0.670 test_accuracy: 0.527\n",
            "[1,  1240] train_loss: 1.079 train_accuracy: 0.656 test_accuracy: 0.515\n",
            "[1,  1245] train_loss: 0.991 train_accuracy: 0.668 test_accuracy: 0.523\n",
            "[2,     5] train_loss: 0.892 train_accuracy: 0.654 test_accuracy: 0.518\n",
            "[2,    10] train_loss: 1.099 train_accuracy: 0.664 test_accuracy: 0.525\n",
            "[2,    15] train_loss: 0.911 train_accuracy: 0.669 test_accuracy: 0.526\n",
            "[2,    20] train_loss: 0.921 train_accuracy: 0.675 test_accuracy: 0.525\n",
            "[2,    25] train_loss: 0.926 train_accuracy: 0.682 test_accuracy: 0.528\n",
            "[2,    30] train_loss: 0.850 train_accuracy: 0.676 test_accuracy: 0.525\n",
            "[2,    35] train_loss: 0.944 train_accuracy: 0.684 test_accuracy: 0.526\n",
            "[2,    40] train_loss: 0.843 train_accuracy: 0.685 test_accuracy: 0.528\n",
            "[2,    45] train_loss: 0.946 train_accuracy: 0.681 test_accuracy: 0.525\n",
            "[2,    50] train_loss: 0.951 train_accuracy: 0.676 test_accuracy: 0.522\n",
            "[2,    55] train_loss: 0.994 train_accuracy: 0.678 test_accuracy: 0.522\n",
            "[2,    60] train_loss: 1.037 train_accuracy: 0.673 test_accuracy: 0.519\n",
            "[2,    65] train_loss: 0.914 train_accuracy: 0.666 test_accuracy: 0.512\n",
            "[2,    70] train_loss: 1.035 train_accuracy: 0.660 test_accuracy: 0.512\n",
            "[2,    75] train_loss: 0.925 train_accuracy: 0.670 test_accuracy: 0.521\n",
            "[2,    80] train_loss: 0.817 train_accuracy: 0.688 test_accuracy: 0.528\n",
            "[2,    85] train_loss: 0.930 train_accuracy: 0.688 test_accuracy: 0.534\n",
            "[2,    90] train_loss: 0.966 train_accuracy: 0.668 test_accuracy: 0.527\n",
            "[2,    95] train_loss: 0.890 train_accuracy: 0.674 test_accuracy: 0.528\n",
            "[2,   100] train_loss: 0.766 train_accuracy: 0.679 test_accuracy: 0.532\n",
            "[2,   105] train_loss: 1.132 train_accuracy: 0.690 test_accuracy: 0.537\n",
            "[2,   110] train_loss: 0.905 train_accuracy: 0.686 test_accuracy: 0.534\n",
            "[2,   115] train_loss: 0.965 train_accuracy: 0.677 test_accuracy: 0.523\n",
            "[2,   120] train_loss: 0.917 train_accuracy: 0.676 test_accuracy: 0.525\n",
            "[2,   125] train_loss: 0.867 train_accuracy: 0.662 test_accuracy: 0.516\n",
            "[2,   130] train_loss: 0.869 train_accuracy: 0.670 test_accuracy: 0.525\n",
            "[2,   135] train_loss: 0.987 train_accuracy: 0.671 test_accuracy: 0.524\n",
            "[2,   140] train_loss: 0.928 train_accuracy: 0.664 test_accuracy: 0.523\n",
            "[2,   145] train_loss: 0.999 train_accuracy: 0.675 test_accuracy: 0.530\n",
            "[2,   150] train_loss: 0.888 train_accuracy: 0.677 test_accuracy: 0.527\n",
            "[2,   155] train_loss: 0.853 train_accuracy: 0.677 test_accuracy: 0.528\n",
            "[2,   160] train_loss: 1.005 train_accuracy: 0.666 test_accuracy: 0.524\n",
            "[2,   165] train_loss: 1.027 train_accuracy: 0.669 test_accuracy: 0.524\n",
            "[2,   170] train_loss: 0.878 train_accuracy: 0.670 test_accuracy: 0.524\n",
            "[2,   175] train_loss: 0.921 train_accuracy: 0.673 test_accuracy: 0.527\n",
            "[2,   180] train_loss: 0.961 train_accuracy: 0.671 test_accuracy: 0.527\n",
            "[2,   185] train_loss: 0.946 train_accuracy: 0.673 test_accuracy: 0.528\n",
            "[2,   190] train_loss: 0.893 train_accuracy: 0.670 test_accuracy: 0.520\n",
            "[2,   195] train_loss: 0.934 train_accuracy: 0.677 test_accuracy: 0.527\n",
            "[2,   200] train_loss: 1.029 train_accuracy: 0.685 test_accuracy: 0.531\n",
            "[2,   205] train_loss: 0.935 train_accuracy: 0.688 test_accuracy: 0.530\n",
            "[2,   210] train_loss: 0.840 train_accuracy: 0.679 test_accuracy: 0.533\n",
            "[2,   215] train_loss: 0.935 train_accuracy: 0.682 test_accuracy: 0.535\n",
            "[2,   220] train_loss: 0.894 train_accuracy: 0.668 test_accuracy: 0.528\n",
            "[2,   225] train_loss: 0.939 train_accuracy: 0.664 test_accuracy: 0.520\n",
            "[2,   230] train_loss: 0.869 train_accuracy: 0.667 test_accuracy: 0.518\n",
            "[2,   235] train_loss: 0.929 train_accuracy: 0.672 test_accuracy: 0.520\n",
            "[2,   240] train_loss: 0.921 train_accuracy: 0.668 test_accuracy: 0.520\n",
            "[2,   245] train_loss: 0.942 train_accuracy: 0.689 test_accuracy: 0.538\n",
            "[2,   250] train_loss: 0.836 train_accuracy: 0.686 test_accuracy: 0.538\n",
            "[2,   255] train_loss: 0.880 train_accuracy: 0.684 test_accuracy: 0.528\n",
            "[2,   260] train_loss: 1.026 train_accuracy: 0.685 test_accuracy: 0.520\n",
            "[2,   265] train_loss: 0.950 train_accuracy: 0.669 test_accuracy: 0.511\n",
            "[2,   270] train_loss: 0.899 train_accuracy: 0.673 test_accuracy: 0.513\n",
            "[2,   275] train_loss: 0.980 train_accuracy: 0.680 test_accuracy: 0.522\n",
            "[2,   280] train_loss: 1.073 train_accuracy: 0.672 test_accuracy: 0.519\n",
            "[2,   285] train_loss: 1.026 train_accuracy: 0.673 test_accuracy: 0.522\n",
            "[2,   290] train_loss: 0.948 train_accuracy: 0.671 test_accuracy: 0.518\n",
            "[2,   295] train_loss: 1.041 train_accuracy: 0.673 test_accuracy: 0.521\n",
            "[2,   300] train_loss: 0.883 train_accuracy: 0.685 test_accuracy: 0.526\n",
            "[2,   305] train_loss: 0.928 train_accuracy: 0.682 test_accuracy: 0.528\n",
            "[2,   310] train_loss: 1.050 train_accuracy: 0.673 test_accuracy: 0.527\n",
            "[2,   315] train_loss: 0.847 train_accuracy: 0.676 test_accuracy: 0.530\n",
            "[2,   320] train_loss: 1.053 train_accuracy: 0.692 test_accuracy: 0.534\n",
            "[2,   325] train_loss: 0.943 train_accuracy: 0.683 test_accuracy: 0.530\n",
            "[2,   330] train_loss: 0.800 train_accuracy: 0.676 test_accuracy: 0.523\n",
            "[2,   335] train_loss: 1.036 train_accuracy: 0.680 test_accuracy: 0.533\n",
            "[2,   340] train_loss: 0.892 train_accuracy: 0.680 test_accuracy: 0.533\n",
            "[2,   345] train_loss: 0.891 train_accuracy: 0.659 test_accuracy: 0.517\n",
            "[2,   350] train_loss: 0.942 train_accuracy: 0.657 test_accuracy: 0.520\n",
            "[2,   355] train_loss: 1.141 train_accuracy: 0.672 test_accuracy: 0.527\n",
            "[2,   360] train_loss: 0.913 train_accuracy: 0.661 test_accuracy: 0.515\n",
            "[2,   365] train_loss: 0.968 train_accuracy: 0.663 test_accuracy: 0.515\n",
            "[2,   370] train_loss: 0.889 train_accuracy: 0.680 test_accuracy: 0.531\n",
            "[2,   375] train_loss: 0.927 train_accuracy: 0.685 test_accuracy: 0.529\n",
            "[2,   380] train_loss: 0.948 train_accuracy: 0.677 test_accuracy: 0.523\n",
            "[2,   385] train_loss: 0.925 train_accuracy: 0.676 test_accuracy: 0.523\n",
            "[2,   390] train_loss: 0.844 train_accuracy: 0.683 test_accuracy: 0.531\n",
            "[2,   395] train_loss: 0.950 train_accuracy: 0.675 test_accuracy: 0.526\n",
            "[2,   400] train_loss: 1.102 train_accuracy: 0.668 test_accuracy: 0.520\n",
            "[2,   405] train_loss: 1.050 train_accuracy: 0.665 test_accuracy: 0.518\n",
            "[2,   410] train_loss: 0.878 train_accuracy: 0.673 test_accuracy: 0.525\n",
            "[2,   415] train_loss: 0.898 train_accuracy: 0.683 test_accuracy: 0.523\n",
            "[2,   420] train_loss: 0.992 train_accuracy: 0.684 test_accuracy: 0.525\n",
            "[2,   425] train_loss: 1.011 train_accuracy: 0.686 test_accuracy: 0.530\n",
            "[2,   430] train_loss: 0.901 train_accuracy: 0.692 test_accuracy: 0.533\n",
            "[2,   435] train_loss: 0.925 train_accuracy: 0.687 test_accuracy: 0.535\n",
            "[2,   440] train_loss: 0.906 train_accuracy: 0.682 test_accuracy: 0.524\n",
            "[2,   445] train_loss: 0.930 train_accuracy: 0.683 test_accuracy: 0.523\n",
            "[2,   450] train_loss: 0.875 train_accuracy: 0.678 test_accuracy: 0.529\n",
            "[2,   455] train_loss: 1.072 train_accuracy: 0.666 test_accuracy: 0.524\n",
            "[2,   460] train_loss: 0.943 train_accuracy: 0.664 test_accuracy: 0.516\n",
            "[2,   465] train_loss: 0.928 train_accuracy: 0.663 test_accuracy: 0.511\n",
            "[2,   470] train_loss: 1.030 train_accuracy: 0.683 test_accuracy: 0.516\n",
            "[2,   475] train_loss: 1.045 train_accuracy: 0.678 test_accuracy: 0.520\n",
            "[2,   480] train_loss: 0.992 train_accuracy: 0.679 test_accuracy: 0.524\n",
            "[2,   485] train_loss: 0.830 train_accuracy: 0.679 test_accuracy: 0.527\n",
            "[2,   490] train_loss: 0.868 train_accuracy: 0.678 test_accuracy: 0.523\n",
            "[2,   495] train_loss: 1.045 train_accuracy: 0.686 test_accuracy: 0.528\n",
            "[2,   500] train_loss: 0.900 train_accuracy: 0.683 test_accuracy: 0.526\n",
            "[2,   505] train_loss: 1.171 train_accuracy: 0.673 test_accuracy: 0.521\n",
            "[2,   510] train_loss: 0.970 train_accuracy: 0.681 test_accuracy: 0.522\n",
            "[2,   515] train_loss: 0.877 train_accuracy: 0.687 test_accuracy: 0.524\n",
            "[2,   520] train_loss: 0.903 train_accuracy: 0.682 test_accuracy: 0.527\n",
            "[2,   525] train_loss: 0.842 train_accuracy: 0.679 test_accuracy: 0.524\n",
            "[2,   530] train_loss: 0.931 train_accuracy: 0.675 test_accuracy: 0.520\n",
            "[2,   535] train_loss: 1.003 train_accuracy: 0.675 test_accuracy: 0.518\n",
            "[2,   540] train_loss: 1.063 train_accuracy: 0.662 test_accuracy: 0.517\n",
            "[2,   545] train_loss: 0.946 train_accuracy: 0.673 test_accuracy: 0.526\n",
            "[2,   550] train_loss: 0.864 train_accuracy: 0.684 test_accuracy: 0.528\n",
            "[2,   555] train_loss: 1.026 train_accuracy: 0.683 test_accuracy: 0.530\n",
            "[2,   560] train_loss: 0.838 train_accuracy: 0.677 test_accuracy: 0.525\n",
            "[2,   565] train_loss: 1.150 train_accuracy: 0.692 test_accuracy: 0.535\n",
            "[2,   570] train_loss: 1.152 train_accuracy: 0.682 test_accuracy: 0.531\n",
            "[2,   575] train_loss: 0.983 train_accuracy: 0.673 test_accuracy: 0.521\n",
            "[2,   580] train_loss: 1.018 train_accuracy: 0.671 test_accuracy: 0.518\n",
            "[2,   585] train_loss: 1.055 train_accuracy: 0.681 test_accuracy: 0.528\n",
            "[2,   590] train_loss: 0.968 train_accuracy: 0.686 test_accuracy: 0.531\n",
            "[2,   595] train_loss: 0.995 train_accuracy: 0.688 test_accuracy: 0.526\n",
            "[2,   600] train_loss: 0.757 train_accuracy: 0.676 test_accuracy: 0.519\n",
            "[2,   605] train_loss: 1.015 train_accuracy: 0.674 test_accuracy: 0.519\n",
            "[2,   610] train_loss: 1.100 train_accuracy: 0.665 test_accuracy: 0.516\n",
            "[2,   615] train_loss: 0.975 train_accuracy: 0.670 test_accuracy: 0.522\n",
            "[2,   620] train_loss: 1.052 train_accuracy: 0.671 test_accuracy: 0.521\n",
            "[2,   625] train_loss: 1.019 train_accuracy: 0.673 test_accuracy: 0.523\n",
            "[2,   630] train_loss: 1.060 train_accuracy: 0.683 test_accuracy: 0.530\n",
            "[2,   635] train_loss: 0.889 train_accuracy: 0.679 test_accuracy: 0.530\n",
            "[2,   640] train_loss: 1.027 train_accuracy: 0.678 test_accuracy: 0.527\n",
            "[2,   645] train_loss: 0.930 train_accuracy: 0.676 test_accuracy: 0.524\n",
            "[2,   650] train_loss: 0.846 train_accuracy: 0.680 test_accuracy: 0.524\n",
            "[2,   655] train_loss: 0.886 train_accuracy: 0.690 test_accuracy: 0.529\n",
            "[2,   660] train_loss: 0.846 train_accuracy: 0.678 test_accuracy: 0.519\n",
            "[2,   665] train_loss: 1.055 train_accuracy: 0.669 test_accuracy: 0.513\n",
            "[2,   670] train_loss: 1.081 train_accuracy: 0.683 test_accuracy: 0.520\n",
            "[2,   675] train_loss: 0.949 train_accuracy: 0.691 test_accuracy: 0.528\n",
            "[2,   680] train_loss: 0.909 train_accuracy: 0.686 test_accuracy: 0.525\n",
            "[2,   685] train_loss: 0.871 train_accuracy: 0.683 test_accuracy: 0.528\n",
            "[2,   690] train_loss: 0.808 train_accuracy: 0.691 test_accuracy: 0.530\n",
            "[2,   695] train_loss: 0.948 train_accuracy: 0.684 test_accuracy: 0.530\n",
            "[2,   700] train_loss: 0.991 train_accuracy: 0.686 test_accuracy: 0.525\n",
            "[2,   705] train_loss: 0.759 train_accuracy: 0.676 test_accuracy: 0.520\n",
            "[2,   710] train_loss: 1.059 train_accuracy: 0.681 test_accuracy: 0.528\n",
            "[2,   715] train_loss: 0.867 train_accuracy: 0.668 test_accuracy: 0.523\n",
            "[2,   720] train_loss: 0.976 train_accuracy: 0.679 test_accuracy: 0.529\n",
            "[2,   725] train_loss: 0.798 train_accuracy: 0.677 test_accuracy: 0.525\n",
            "[2,   730] train_loss: 1.018 train_accuracy: 0.680 test_accuracy: 0.527\n",
            "[2,   735] train_loss: 1.164 train_accuracy: 0.683 test_accuracy: 0.532\n",
            "[2,   740] train_loss: 0.891 train_accuracy: 0.683 test_accuracy: 0.531\n",
            "[2,   745] train_loss: 0.924 train_accuracy: 0.684 test_accuracy: 0.529\n",
            "[2,   750] train_loss: 0.962 train_accuracy: 0.695 test_accuracy: 0.533\n",
            "[2,   755] train_loss: 0.939 train_accuracy: 0.686 test_accuracy: 0.528\n",
            "[2,   760] train_loss: 0.858 train_accuracy: 0.680 test_accuracy: 0.526\n",
            "[2,   765] train_loss: 0.876 train_accuracy: 0.678 test_accuracy: 0.523\n",
            "[2,   770] train_loss: 1.084 train_accuracy: 0.672 test_accuracy: 0.526\n",
            "[2,   775] train_loss: 1.164 train_accuracy: 0.676 test_accuracy: 0.524\n",
            "[2,   780] train_loss: 1.008 train_accuracy: 0.667 test_accuracy: 0.514\n",
            "[2,   785] train_loss: 0.959 train_accuracy: 0.671 test_accuracy: 0.514\n",
            "[2,   790] train_loss: 1.047 train_accuracy: 0.670 test_accuracy: 0.512\n",
            "[2,   795] train_loss: 0.915 train_accuracy: 0.668 test_accuracy: 0.514\n",
            "[2,   800] train_loss: 1.071 train_accuracy: 0.674 test_accuracy: 0.516\n",
            "[2,   805] train_loss: 0.820 train_accuracy: 0.684 test_accuracy: 0.522\n",
            "[2,   810] train_loss: 0.851 train_accuracy: 0.676 test_accuracy: 0.522\n",
            "[2,   815] train_loss: 1.080 train_accuracy: 0.682 test_accuracy: 0.529\n",
            "[2,   820] train_loss: 1.089 train_accuracy: 0.681 test_accuracy: 0.526\n",
            "[2,   825] train_loss: 0.923 train_accuracy: 0.674 test_accuracy: 0.520\n",
            "[2,   830] train_loss: 1.068 train_accuracy: 0.672 test_accuracy: 0.523\n",
            "[2,   835] train_loss: 0.920 train_accuracy: 0.681 test_accuracy: 0.530\n",
            "[2,   840] train_loss: 0.873 train_accuracy: 0.673 test_accuracy: 0.525\n",
            "[2,   845] train_loss: 1.025 train_accuracy: 0.682 test_accuracy: 0.533\n",
            "[2,   850] train_loss: 1.065 train_accuracy: 0.692 test_accuracy: 0.532\n",
            "[2,   855] train_loss: 1.002 train_accuracy: 0.673 test_accuracy: 0.516\n",
            "[2,   860] train_loss: 0.896 train_accuracy: 0.670 test_accuracy: 0.517\n",
            "[2,   865] train_loss: 1.005 train_accuracy: 0.690 test_accuracy: 0.534\n",
            "[2,   870] train_loss: 0.891 train_accuracy: 0.678 test_accuracy: 0.531\n",
            "[2,   875] train_loss: 0.986 train_accuracy: 0.696 test_accuracy: 0.530\n",
            "[2,   880] train_loss: 0.925 train_accuracy: 0.698 test_accuracy: 0.532\n",
            "[2,   885] train_loss: 0.927 train_accuracy: 0.693 test_accuracy: 0.530\n",
            "[2,   890] train_loss: 1.052 train_accuracy: 0.689 test_accuracy: 0.529\n",
            "[2,   895] train_loss: 0.851 train_accuracy: 0.684 test_accuracy: 0.532\n",
            "[2,   900] train_loss: 0.929 train_accuracy: 0.680 test_accuracy: 0.525\n",
            "[2,   905] train_loss: 1.088 train_accuracy: 0.683 test_accuracy: 0.524\n",
            "[2,   910] train_loss: 1.080 train_accuracy: 0.679 test_accuracy: 0.515\n",
            "[2,   915] train_loss: 0.972 train_accuracy: 0.673 test_accuracy: 0.512\n",
            "[2,   920] train_loss: 0.891 train_accuracy: 0.666 test_accuracy: 0.508\n",
            "[2,   925] train_loss: 0.948 train_accuracy: 0.661 test_accuracy: 0.508\n",
            "[2,   930] train_loss: 0.937 train_accuracy: 0.673 test_accuracy: 0.516\n",
            "[2,   935] train_loss: 0.979 train_accuracy: 0.685 test_accuracy: 0.531\n",
            "[2,   940] train_loss: 0.918 train_accuracy: 0.688 test_accuracy: 0.528\n",
            "[2,   945] train_loss: 1.075 train_accuracy: 0.695 test_accuracy: 0.535\n",
            "[2,   950] train_loss: 0.993 train_accuracy: 0.698 test_accuracy: 0.534\n",
            "[2,   955] train_loss: 0.866 train_accuracy: 0.692 test_accuracy: 0.530\n",
            "[2,   960] train_loss: 1.159 train_accuracy: 0.687 test_accuracy: 0.530\n",
            "[2,   965] train_loss: 0.974 train_accuracy: 0.686 test_accuracy: 0.532\n",
            "[2,   970] train_loss: 0.922 train_accuracy: 0.683 test_accuracy: 0.528\n",
            "[2,   975] train_loss: 0.967 train_accuracy: 0.695 test_accuracy: 0.533\n",
            "[2,   980] train_loss: 0.998 train_accuracy: 0.693 test_accuracy: 0.534\n",
            "[2,   985] train_loss: 0.943 train_accuracy: 0.687 test_accuracy: 0.526\n",
            "[2,   990] train_loss: 0.970 train_accuracy: 0.692 test_accuracy: 0.532\n",
            "[2,   995] train_loss: 0.950 train_accuracy: 0.690 test_accuracy: 0.532\n",
            "[2,  1000] train_loss: 0.794 train_accuracy: 0.682 test_accuracy: 0.529\n",
            "[2,  1005] train_loss: 0.991 train_accuracy: 0.696 test_accuracy: 0.540\n",
            "[2,  1010] train_loss: 0.956 train_accuracy: 0.681 test_accuracy: 0.519\n",
            "[2,  1015] train_loss: 0.980 train_accuracy: 0.682 test_accuracy: 0.523\n",
            "[2,  1020] train_loss: 0.946 train_accuracy: 0.689 test_accuracy: 0.531\n",
            "[2,  1025] train_loss: 0.857 train_accuracy: 0.685 test_accuracy: 0.523\n",
            "[2,  1030] train_loss: 0.942 train_accuracy: 0.682 test_accuracy: 0.516\n",
            "[2,  1035] train_loss: 1.178 train_accuracy: 0.678 test_accuracy: 0.517\n",
            "[2,  1040] train_loss: 0.962 train_accuracy: 0.690 test_accuracy: 0.525\n",
            "[2,  1045] train_loss: 1.007 train_accuracy: 0.699 test_accuracy: 0.529\n",
            "[2,  1050] train_loss: 0.955 train_accuracy: 0.686 test_accuracy: 0.519\n",
            "[2,  1055] train_loss: 0.983 train_accuracy: 0.687 test_accuracy: 0.524\n",
            "[2,  1060] train_loss: 1.008 train_accuracy: 0.689 test_accuracy: 0.531\n",
            "[2,  1065] train_loss: 0.927 train_accuracy: 0.684 test_accuracy: 0.536\n",
            "[2,  1070] train_loss: 1.086 train_accuracy: 0.677 test_accuracy: 0.526\n",
            "[2,  1075] train_loss: 1.032 train_accuracy: 0.684 test_accuracy: 0.528\n",
            "[2,  1080] train_loss: 0.854 train_accuracy: 0.684 test_accuracy: 0.529\n",
            "[2,  1085] train_loss: 0.961 train_accuracy: 0.680 test_accuracy: 0.524\n",
            "[2,  1090] train_loss: 1.014 train_accuracy: 0.686 test_accuracy: 0.520\n",
            "[2,  1095] train_loss: 0.840 train_accuracy: 0.683 test_accuracy: 0.521\n",
            "[2,  1100] train_loss: 1.105 train_accuracy: 0.686 test_accuracy: 0.532\n",
            "[2,  1105] train_loss: 1.010 train_accuracy: 0.686 test_accuracy: 0.530\n",
            "[2,  1110] train_loss: 0.962 train_accuracy: 0.672 test_accuracy: 0.523\n",
            "[2,  1115] train_loss: 0.880 train_accuracy: 0.673 test_accuracy: 0.527\n",
            "[2,  1120] train_loss: 0.887 train_accuracy: 0.676 test_accuracy: 0.524\n",
            "[2,  1125] train_loss: 1.136 train_accuracy: 0.676 test_accuracy: 0.521\n",
            "[2,  1130] train_loss: 1.056 train_accuracy: 0.677 test_accuracy: 0.516\n",
            "[2,  1135] train_loss: 1.192 train_accuracy: 0.672 test_accuracy: 0.521\n",
            "[2,  1140] train_loss: 1.022 train_accuracy: 0.680 test_accuracy: 0.521\n",
            "[2,  1145] train_loss: 0.921 train_accuracy: 0.677 test_accuracy: 0.517\n",
            "[2,  1150] train_loss: 1.007 train_accuracy: 0.677 test_accuracy: 0.517\n",
            "[2,  1155] train_loss: 1.003 train_accuracy: 0.687 test_accuracy: 0.524\n",
            "[2,  1160] train_loss: 1.162 train_accuracy: 0.688 test_accuracy: 0.523\n",
            "[2,  1165] train_loss: 0.972 train_accuracy: 0.689 test_accuracy: 0.526\n",
            "[2,  1170] train_loss: 0.849 train_accuracy: 0.686 test_accuracy: 0.524\n",
            "[2,  1175] train_loss: 0.937 train_accuracy: 0.683 test_accuracy: 0.523\n",
            "[2,  1180] train_loss: 0.969 train_accuracy: 0.690 test_accuracy: 0.523\n",
            "[2,  1185] train_loss: 1.052 train_accuracy: 0.688 test_accuracy: 0.520\n",
            "[2,  1190] train_loss: 1.049 train_accuracy: 0.699 test_accuracy: 0.537\n",
            "[2,  1195] train_loss: 1.019 train_accuracy: 0.693 test_accuracy: 0.531\n",
            "[2,  1200] train_loss: 0.952 train_accuracy: 0.696 test_accuracy: 0.535\n",
            "[2,  1205] train_loss: 0.934 train_accuracy: 0.701 test_accuracy: 0.533\n",
            "[2,  1210] train_loss: 1.053 train_accuracy: 0.692 test_accuracy: 0.523\n",
            "[2,  1215] train_loss: 0.946 train_accuracy: 0.689 test_accuracy: 0.523\n",
            "[2,  1220] train_loss: 1.097 train_accuracy: 0.680 test_accuracy: 0.527\n",
            "[2,  1225] train_loss: 0.965 train_accuracy: 0.677 test_accuracy: 0.526\n",
            "[2,  1230] train_loss: 0.967 train_accuracy: 0.665 test_accuracy: 0.523\n",
            "[2,  1235] train_loss: 0.979 train_accuracy: 0.670 test_accuracy: 0.523\n",
            "[2,  1240] train_loss: 1.062 train_accuracy: 0.669 test_accuracy: 0.520\n",
            "[2,  1245] train_loss: 0.910 train_accuracy: 0.670 test_accuracy: 0.521\n",
            "[3,     5] train_loss: 0.963 train_accuracy: 0.682 test_accuracy: 0.529\n",
            "[3,    10] train_loss: 0.995 train_accuracy: 0.684 test_accuracy: 0.533\n",
            "[3,    15] train_loss: 0.962 train_accuracy: 0.689 test_accuracy: 0.535\n",
            "[3,    20] train_loss: 0.969 train_accuracy: 0.700 test_accuracy: 0.535\n",
            "[3,    25] train_loss: 0.917 train_accuracy: 0.694 test_accuracy: 0.531\n",
            "[3,    30] train_loss: 0.935 train_accuracy: 0.695 test_accuracy: 0.528\n",
            "[3,    35] train_loss: 0.814 train_accuracy: 0.694 test_accuracy: 0.533\n",
            "[3,    40] train_loss: 0.938 train_accuracy: 0.694 test_accuracy: 0.531\n",
            "[3,    45] train_loss: 0.879 train_accuracy: 0.685 test_accuracy: 0.525\n",
            "[3,    50] train_loss: 0.893 train_accuracy: 0.688 test_accuracy: 0.517\n",
            "[3,    55] train_loss: 0.786 train_accuracy: 0.689 test_accuracy: 0.516\n",
            "[3,    60] train_loss: 0.941 train_accuracy: 0.693 test_accuracy: 0.524\n",
            "[3,    65] train_loss: 0.959 train_accuracy: 0.688 test_accuracy: 0.531\n",
            "[3,    70] train_loss: 1.042 train_accuracy: 0.702 test_accuracy: 0.536\n",
            "[3,    75] train_loss: 0.632 train_accuracy: 0.695 test_accuracy: 0.534\n",
            "[3,    80] train_loss: 0.905 train_accuracy: 0.693 test_accuracy: 0.532\n",
            "[3,    85] train_loss: 0.885 train_accuracy: 0.697 test_accuracy: 0.528\n",
            "[3,    90] train_loss: 0.941 train_accuracy: 0.702 test_accuracy: 0.526\n",
            "[3,    95] train_loss: 0.982 train_accuracy: 0.692 test_accuracy: 0.526\n",
            "[3,   100] train_loss: 1.066 train_accuracy: 0.688 test_accuracy: 0.527\n",
            "[3,   105] train_loss: 0.956 train_accuracy: 0.691 test_accuracy: 0.524\n",
            "[3,   110] train_loss: 0.894 train_accuracy: 0.698 test_accuracy: 0.530\n",
            "[3,   115] train_loss: 0.940 train_accuracy: 0.688 test_accuracy: 0.525\n",
            "[3,   120] train_loss: 0.817 train_accuracy: 0.694 test_accuracy: 0.524\n",
            "[3,   125] train_loss: 0.926 train_accuracy: 0.694 test_accuracy: 0.524\n",
            "[3,   130] train_loss: 0.786 train_accuracy: 0.693 test_accuracy: 0.525\n",
            "[3,   135] train_loss: 0.908 train_accuracy: 0.701 test_accuracy: 0.537\n",
            "[3,   140] train_loss: 0.824 train_accuracy: 0.691 test_accuracy: 0.533\n",
            "[3,   145] train_loss: 0.888 train_accuracy: 0.693 test_accuracy: 0.525\n",
            "[3,   150] train_loss: 0.929 train_accuracy: 0.706 test_accuracy: 0.531\n",
            "[3,   155] train_loss: 0.862 train_accuracy: 0.697 test_accuracy: 0.528\n",
            "[3,   160] train_loss: 0.885 train_accuracy: 0.698 test_accuracy: 0.529\n",
            "[3,   165] train_loss: 1.059 train_accuracy: 0.705 test_accuracy: 0.534\n",
            "[3,   170] train_loss: 0.870 train_accuracy: 0.709 test_accuracy: 0.538\n",
            "[3,   175] train_loss: 0.985 train_accuracy: 0.705 test_accuracy: 0.535\n",
            "[3,   180] train_loss: 0.902 train_accuracy: 0.710 test_accuracy: 0.537\n",
            "[3,   185] train_loss: 0.842 train_accuracy: 0.702 test_accuracy: 0.531\n",
            "[3,   190] train_loss: 0.885 train_accuracy: 0.702 test_accuracy: 0.532\n",
            "[3,   195] train_loss: 0.891 train_accuracy: 0.698 test_accuracy: 0.537\n",
            "[3,   200] train_loss: 0.777 train_accuracy: 0.697 test_accuracy: 0.530\n",
            "[3,   205] train_loss: 0.806 train_accuracy: 0.700 test_accuracy: 0.535\n",
            "[3,   210] train_loss: 0.800 train_accuracy: 0.701 test_accuracy: 0.533\n",
            "[3,   215] train_loss: 0.996 train_accuracy: 0.701 test_accuracy: 0.533\n",
            "[3,   220] train_loss: 0.859 train_accuracy: 0.690 test_accuracy: 0.530\n",
            "[3,   225] train_loss: 0.964 train_accuracy: 0.684 test_accuracy: 0.530\n",
            "[3,   230] train_loss: 0.790 train_accuracy: 0.691 test_accuracy: 0.536\n",
            "[3,   235] train_loss: 0.979 train_accuracy: 0.695 test_accuracy: 0.530\n",
            "[3,   240] train_loss: 0.939 train_accuracy: 0.698 test_accuracy: 0.529\n",
            "[3,   245] train_loss: 0.914 train_accuracy: 0.698 test_accuracy: 0.528\n",
            "[3,   250] train_loss: 1.038 train_accuracy: 0.701 test_accuracy: 0.530\n",
            "[3,   255] train_loss: 0.914 train_accuracy: 0.693 test_accuracy: 0.528\n",
            "[3,   260] train_loss: 0.752 train_accuracy: 0.688 test_accuracy: 0.526\n",
            "[3,   265] train_loss: 0.819 train_accuracy: 0.691 test_accuracy: 0.528\n",
            "[3,   270] train_loss: 1.104 train_accuracy: 0.693 test_accuracy: 0.531\n",
            "[3,   275] train_loss: 0.821 train_accuracy: 0.704 test_accuracy: 0.535\n",
            "[3,   280] train_loss: 0.814 train_accuracy: 0.699 test_accuracy: 0.536\n",
            "[3,   285] train_loss: 0.954 train_accuracy: 0.699 test_accuracy: 0.534\n",
            "[3,   290] train_loss: 0.812 train_accuracy: 0.714 test_accuracy: 0.541\n",
            "[3,   295] train_loss: 0.878 train_accuracy: 0.711 test_accuracy: 0.532\n",
            "[3,   300] train_loss: 0.809 train_accuracy: 0.699 test_accuracy: 0.531\n",
            "[3,   305] train_loss: 0.820 train_accuracy: 0.696 test_accuracy: 0.526\n",
            "[3,   310] train_loss: 0.748 train_accuracy: 0.701 test_accuracy: 0.529\n",
            "[3,   315] train_loss: 0.956 train_accuracy: 0.695 test_accuracy: 0.525\n",
            "[3,   320] train_loss: 0.957 train_accuracy: 0.695 test_accuracy: 0.528\n",
            "[3,   325] train_loss: 0.921 train_accuracy: 0.699 test_accuracy: 0.533\n",
            "[3,   330] train_loss: 0.822 train_accuracy: 0.692 test_accuracy: 0.526\n",
            "[3,   335] train_loss: 0.883 train_accuracy: 0.701 test_accuracy: 0.528\n",
            "[3,   340] train_loss: 0.825 train_accuracy: 0.691 test_accuracy: 0.527\n",
            "[3,   345] train_loss: 0.978 train_accuracy: 0.691 test_accuracy: 0.529\n",
            "[3,   350] train_loss: 0.877 train_accuracy: 0.699 test_accuracy: 0.533\n",
            "[3,   355] train_loss: 0.898 train_accuracy: 0.687 test_accuracy: 0.525\n",
            "[3,   360] train_loss: 1.053 train_accuracy: 0.693 test_accuracy: 0.529\n",
            "[3,   365] train_loss: 0.843 train_accuracy: 0.697 test_accuracy: 0.529\n",
            "[3,   370] train_loss: 0.914 train_accuracy: 0.695 test_accuracy: 0.530\n",
            "[3,   375] train_loss: 0.807 train_accuracy: 0.701 test_accuracy: 0.528\n",
            "[3,   380] train_loss: 0.757 train_accuracy: 0.701 test_accuracy: 0.529\n",
            "[3,   385] train_loss: 0.964 train_accuracy: 0.702 test_accuracy: 0.531\n",
            "[3,   390] train_loss: 0.929 train_accuracy: 0.705 test_accuracy: 0.532\n",
            "[3,   395] train_loss: 0.818 train_accuracy: 0.692 test_accuracy: 0.530\n",
            "[3,   400] train_loss: 0.934 train_accuracy: 0.688 test_accuracy: 0.518\n",
            "[3,   405] train_loss: 0.951 train_accuracy: 0.690 test_accuracy: 0.527\n",
            "[3,   410] train_loss: 1.075 train_accuracy: 0.698 test_accuracy: 0.528\n",
            "[3,   415] train_loss: 0.859 train_accuracy: 0.693 test_accuracy: 0.526\n",
            "[3,   420] train_loss: 0.928 train_accuracy: 0.698 test_accuracy: 0.531\n",
            "[3,   425] train_loss: 0.907 train_accuracy: 0.687 test_accuracy: 0.522\n",
            "[3,   430] train_loss: 1.006 train_accuracy: 0.679 test_accuracy: 0.518\n",
            "[3,   435] train_loss: 1.129 train_accuracy: 0.680 test_accuracy: 0.519\n",
            "[3,   440] train_loss: 0.992 train_accuracy: 0.695 test_accuracy: 0.522\n",
            "[3,   445] train_loss: 0.918 train_accuracy: 0.687 test_accuracy: 0.518\n",
            "[3,   450] train_loss: 0.901 train_accuracy: 0.691 test_accuracy: 0.526\n",
            "[3,   455] train_loss: 0.964 train_accuracy: 0.694 test_accuracy: 0.528\n",
            "[3,   460] train_loss: 0.947 train_accuracy: 0.693 test_accuracy: 0.523\n",
            "[3,   465] train_loss: 0.856 train_accuracy: 0.695 test_accuracy: 0.531\n",
            "[3,   470] train_loss: 0.933 train_accuracy: 0.697 test_accuracy: 0.531\n",
            "[3,   475] train_loss: 0.835 train_accuracy: 0.697 test_accuracy: 0.531\n",
            "[3,   480] train_loss: 0.873 train_accuracy: 0.695 test_accuracy: 0.529\n",
            "[3,   485] train_loss: 0.861 train_accuracy: 0.684 test_accuracy: 0.523\n",
            "[3,   490] train_loss: 1.011 train_accuracy: 0.692 test_accuracy: 0.529\n",
            "[3,   495] train_loss: 0.901 train_accuracy: 0.687 test_accuracy: 0.524\n",
            "[3,   500] train_loss: 1.086 train_accuracy: 0.698 test_accuracy: 0.528\n",
            "[3,   505] train_loss: 0.916 train_accuracy: 0.693 test_accuracy: 0.529\n",
            "[3,   510] train_loss: 1.049 train_accuracy: 0.700 test_accuracy: 0.538\n",
            "[3,   515] train_loss: 0.840 train_accuracy: 0.700 test_accuracy: 0.536\n",
            "[3,   520] train_loss: 0.935 train_accuracy: 0.688 test_accuracy: 0.524\n",
            "[3,   525] train_loss: 0.979 train_accuracy: 0.691 test_accuracy: 0.525\n",
            "[3,   530] train_loss: 0.893 train_accuracy: 0.693 test_accuracy: 0.528\n",
            "[3,   535] train_loss: 0.871 train_accuracy: 0.705 test_accuracy: 0.534\n",
            "[3,   540] train_loss: 0.833 train_accuracy: 0.699 test_accuracy: 0.531\n",
            "[3,   545] train_loss: 0.947 train_accuracy: 0.689 test_accuracy: 0.525\n",
            "[3,   550] train_loss: 0.978 train_accuracy: 0.693 test_accuracy: 0.527\n",
            "[3,   555] train_loss: 0.972 train_accuracy: 0.686 test_accuracy: 0.525\n",
            "[3,   560] train_loss: 1.011 train_accuracy: 0.673 test_accuracy: 0.518\n",
            "[3,   565] train_loss: 0.898 train_accuracy: 0.685 test_accuracy: 0.524\n",
            "[3,   570] train_loss: 0.868 train_accuracy: 0.682 test_accuracy: 0.525\n",
            "[3,   575] train_loss: 0.997 train_accuracy: 0.696 test_accuracy: 0.529\n",
            "[3,   580] train_loss: 0.872 train_accuracy: 0.698 test_accuracy: 0.529\n",
            "[3,   585] train_loss: 0.906 train_accuracy: 0.695 test_accuracy: 0.526\n",
            "[3,   590] train_loss: 0.852 train_accuracy: 0.685 test_accuracy: 0.522\n",
            "[3,   595] train_loss: 0.988 train_accuracy: 0.673 test_accuracy: 0.508\n",
            "[3,   600] train_loss: 0.891 train_accuracy: 0.688 test_accuracy: 0.519\n",
            "[3,   605] train_loss: 0.769 train_accuracy: 0.690 test_accuracy: 0.523\n",
            "[3,   610] train_loss: 0.851 train_accuracy: 0.687 test_accuracy: 0.520\n",
            "[3,   615] train_loss: 1.027 train_accuracy: 0.694 test_accuracy: 0.523\n",
            "[3,   620] train_loss: 0.949 train_accuracy: 0.702 test_accuracy: 0.526\n",
            "[3,   625] train_loss: 0.969 train_accuracy: 0.705 test_accuracy: 0.529\n",
            "[3,   630] train_loss: 0.925 train_accuracy: 0.709 test_accuracy: 0.533\n",
            "[3,   635] train_loss: 0.762 train_accuracy: 0.706 test_accuracy: 0.532\n",
            "[3,   640] train_loss: 0.955 train_accuracy: 0.701 test_accuracy: 0.529\n",
            "[3,   645] train_loss: 0.917 train_accuracy: 0.701 test_accuracy: 0.532\n",
            "[3,   650] train_loss: 0.937 train_accuracy: 0.703 test_accuracy: 0.533\n",
            "[3,   655] train_loss: 0.954 train_accuracy: 0.705 test_accuracy: 0.538\n",
            "[3,   660] train_loss: 0.834 train_accuracy: 0.699 test_accuracy: 0.533\n",
            "[3,   665] train_loss: 0.966 train_accuracy: 0.697 test_accuracy: 0.532\n",
            "[3,   670] train_loss: 0.844 train_accuracy: 0.696 test_accuracy: 0.534\n",
            "[3,   675] train_loss: 0.885 train_accuracy: 0.694 test_accuracy: 0.533\n",
            "[3,   680] train_loss: 0.786 train_accuracy: 0.692 test_accuracy: 0.530\n",
            "[3,   685] train_loss: 0.867 train_accuracy: 0.699 test_accuracy: 0.530\n",
            "[3,   690] train_loss: 0.947 train_accuracy: 0.701 test_accuracy: 0.534\n",
            "[3,   695] train_loss: 0.921 train_accuracy: 0.689 test_accuracy: 0.521\n",
            "[3,   700] train_loss: 0.911 train_accuracy: 0.689 test_accuracy: 0.521\n",
            "[3,   705] train_loss: 0.884 train_accuracy: 0.693 test_accuracy: 0.525\n",
            "[3,   710] train_loss: 1.106 train_accuracy: 0.691 test_accuracy: 0.527\n",
            "[3,   715] train_loss: 0.832 train_accuracy: 0.690 test_accuracy: 0.528\n",
            "[3,   720] train_loss: 0.883 train_accuracy: 0.686 test_accuracy: 0.525\n",
            "[3,   725] train_loss: 1.003 train_accuracy: 0.700 test_accuracy: 0.533\n",
            "[3,   730] train_loss: 0.791 train_accuracy: 0.699 test_accuracy: 0.535\n",
            "[3,   735] train_loss: 0.809 train_accuracy: 0.698 test_accuracy: 0.533\n",
            "[3,   740] train_loss: 0.849 train_accuracy: 0.697 test_accuracy: 0.533\n",
            "[3,   745] train_loss: 0.957 train_accuracy: 0.693 test_accuracy: 0.534\n",
            "[3,   750] train_loss: 1.187 train_accuracy: 0.708 test_accuracy: 0.541\n",
            "[3,   755] train_loss: 0.923 train_accuracy: 0.686 test_accuracy: 0.526\n",
            "[3,   760] train_loss: 1.014 train_accuracy: 0.688 test_accuracy: 0.524\n",
            "[3,   765] train_loss: 0.957 train_accuracy: 0.689 test_accuracy: 0.524\n",
            "[3,   770] train_loss: 1.107 train_accuracy: 0.695 test_accuracy: 0.531\n",
            "[3,   775] train_loss: 0.921 train_accuracy: 0.693 test_accuracy: 0.532\n",
            "[3,   780] train_loss: 0.929 train_accuracy: 0.700 test_accuracy: 0.533\n",
            "[3,   785] train_loss: 0.825 train_accuracy: 0.704 test_accuracy: 0.533\n",
            "[3,   790] train_loss: 0.869 train_accuracy: 0.693 test_accuracy: 0.527\n",
            "[3,   795] train_loss: 0.835 train_accuracy: 0.691 test_accuracy: 0.525\n",
            "[3,   800] train_loss: 1.003 train_accuracy: 0.688 test_accuracy: 0.524\n",
            "[3,   805] train_loss: 0.975 train_accuracy: 0.701 test_accuracy: 0.533\n",
            "[3,   810] train_loss: 0.846 train_accuracy: 0.700 test_accuracy: 0.533\n",
            "[3,   815] train_loss: 1.019 train_accuracy: 0.708 test_accuracy: 0.537\n",
            "[3,   820] train_loss: 0.951 train_accuracy: 0.706 test_accuracy: 0.536\n",
            "[3,   825] train_loss: 0.822 train_accuracy: 0.696 test_accuracy: 0.527\n",
            "[3,   830] train_loss: 0.996 train_accuracy: 0.709 test_accuracy: 0.538\n",
            "[3,   835] train_loss: 0.953 train_accuracy: 0.705 test_accuracy: 0.531\n",
            "[3,   840] train_loss: 1.021 train_accuracy: 0.704 test_accuracy: 0.533\n",
            "[3,   845] train_loss: 0.956 train_accuracy: 0.701 test_accuracy: 0.536\n",
            "[3,   850] train_loss: 0.922 train_accuracy: 0.696 test_accuracy: 0.535\n",
            "[3,   855] train_loss: 0.953 train_accuracy: 0.712 test_accuracy: 0.534\n",
            "[3,   860] train_loss: 0.831 train_accuracy: 0.701 test_accuracy: 0.530\n",
            "[3,   865] train_loss: 1.059 train_accuracy: 0.704 test_accuracy: 0.530\n",
            "[3,   870] train_loss: 0.944 train_accuracy: 0.714 test_accuracy: 0.540\n",
            "[3,   875] train_loss: 0.778 train_accuracy: 0.715 test_accuracy: 0.538\n",
            "[3,   880] train_loss: 0.919 train_accuracy: 0.712 test_accuracy: 0.540\n",
            "[3,   885] train_loss: 0.884 train_accuracy: 0.709 test_accuracy: 0.537\n",
            "[3,   890] train_loss: 0.955 train_accuracy: 0.714 test_accuracy: 0.541\n",
            "[3,   895] train_loss: 0.865 train_accuracy: 0.702 test_accuracy: 0.533\n",
            "[3,   900] train_loss: 0.866 train_accuracy: 0.701 test_accuracy: 0.534\n",
            "[3,   905] train_loss: 0.756 train_accuracy: 0.705 test_accuracy: 0.534\n",
            "[3,   910] train_loss: 0.800 train_accuracy: 0.703 test_accuracy: 0.534\n",
            "[3,   915] train_loss: 0.941 train_accuracy: 0.708 test_accuracy: 0.537\n",
            "[3,   920] train_loss: 1.075 train_accuracy: 0.709 test_accuracy: 0.531\n",
            "[3,   925] train_loss: 0.892 train_accuracy: 0.700 test_accuracy: 0.526\n",
            "[3,   930] train_loss: 0.779 train_accuracy: 0.701 test_accuracy: 0.528\n",
            "[3,   935] train_loss: 0.930 train_accuracy: 0.702 test_accuracy: 0.531\n",
            "[3,   940] train_loss: 0.766 train_accuracy: 0.691 test_accuracy: 0.526\n",
            "[3,   945] train_loss: 1.131 train_accuracy: 0.705 test_accuracy: 0.528\n",
            "[3,   950] train_loss: 1.005 train_accuracy: 0.693 test_accuracy: 0.517\n",
            "[3,   955] train_loss: 1.025 train_accuracy: 0.698 test_accuracy: 0.531\n",
            "[3,   960] train_loss: 0.953 train_accuracy: 0.695 test_accuracy: 0.527\n",
            "[3,   965] train_loss: 1.028 train_accuracy: 0.704 test_accuracy: 0.533\n",
            "[3,   970] train_loss: 0.917 train_accuracy: 0.710 test_accuracy: 0.537\n",
            "[3,   975] train_loss: 0.781 train_accuracy: 0.712 test_accuracy: 0.535\n",
            "[3,   980] train_loss: 0.866 train_accuracy: 0.699 test_accuracy: 0.524\n",
            "[3,   985] train_loss: 0.879 train_accuracy: 0.701 test_accuracy: 0.524\n",
            "[3,   990] train_loss: 0.883 train_accuracy: 0.701 test_accuracy: 0.525\n",
            "[3,   995] train_loss: 0.981 train_accuracy: 0.690 test_accuracy: 0.518\n",
            "[3,  1000] train_loss: 0.954 train_accuracy: 0.706 test_accuracy: 0.530\n",
            "[3,  1005] train_loss: 0.865 train_accuracy: 0.697 test_accuracy: 0.522\n",
            "[3,  1010] train_loss: 1.197 train_accuracy: 0.688 test_accuracy: 0.521\n",
            "[3,  1015] train_loss: 1.043 train_accuracy: 0.692 test_accuracy: 0.516\n",
            "[3,  1020] train_loss: 0.919 train_accuracy: 0.680 test_accuracy: 0.501\n",
            "[3,  1025] train_loss: 0.940 train_accuracy: 0.699 test_accuracy: 0.519\n",
            "[3,  1030] train_loss: 1.105 train_accuracy: 0.690 test_accuracy: 0.520\n",
            "[3,  1035] train_loss: 0.892 train_accuracy: 0.685 test_accuracy: 0.515\n",
            "[3,  1040] train_loss: 0.991 train_accuracy: 0.694 test_accuracy: 0.519\n",
            "[3,  1045] train_loss: 0.987 train_accuracy: 0.686 test_accuracy: 0.516\n",
            "[3,  1050] train_loss: 0.947 train_accuracy: 0.685 test_accuracy: 0.510\n",
            "[3,  1055] train_loss: 0.857 train_accuracy: 0.712 test_accuracy: 0.530\n",
            "[3,  1060] train_loss: 0.889 train_accuracy: 0.715 test_accuracy: 0.528\n",
            "[3,  1065] train_loss: 0.854 train_accuracy: 0.718 test_accuracy: 0.533\n",
            "[3,  1070] train_loss: 1.004 train_accuracy: 0.714 test_accuracy: 0.529\n",
            "[3,  1075] train_loss: 1.007 train_accuracy: 0.714 test_accuracy: 0.531\n",
            "[3,  1080] train_loss: 0.870 train_accuracy: 0.708 test_accuracy: 0.527\n",
            "[3,  1085] train_loss: 0.889 train_accuracy: 0.700 test_accuracy: 0.520\n",
            "[3,  1090] train_loss: 1.012 train_accuracy: 0.695 test_accuracy: 0.514\n",
            "[3,  1095] train_loss: 0.905 train_accuracy: 0.699 test_accuracy: 0.517\n",
            "[3,  1100] train_loss: 0.953 train_accuracy: 0.696 test_accuracy: 0.520\n",
            "[3,  1105] train_loss: 1.035 train_accuracy: 0.690 test_accuracy: 0.519\n",
            "[3,  1110] train_loss: 1.100 train_accuracy: 0.696 test_accuracy: 0.527\n",
            "[3,  1115] train_loss: 0.987 train_accuracy: 0.692 test_accuracy: 0.524\n",
            "[3,  1120] train_loss: 1.030 train_accuracy: 0.692 test_accuracy: 0.527\n",
            "[3,  1125] train_loss: 0.892 train_accuracy: 0.697 test_accuracy: 0.524\n",
            "[3,  1130] train_loss: 0.847 train_accuracy: 0.710 test_accuracy: 0.530\n",
            "[3,  1135] train_loss: 0.953 train_accuracy: 0.715 test_accuracy: 0.533\n",
            "[3,  1140] train_loss: 0.909 train_accuracy: 0.714 test_accuracy: 0.536\n",
            "[3,  1145] train_loss: 0.910 train_accuracy: 0.709 test_accuracy: 0.530\n",
            "[3,  1150] train_loss: 1.052 train_accuracy: 0.704 test_accuracy: 0.524\n",
            "[3,  1155] train_loss: 0.770 train_accuracy: 0.703 test_accuracy: 0.519\n",
            "[3,  1160] train_loss: 0.813 train_accuracy: 0.692 test_accuracy: 0.515\n",
            "[3,  1165] train_loss: 1.009 train_accuracy: 0.704 test_accuracy: 0.523\n",
            "[3,  1170] train_loss: 0.912 train_accuracy: 0.703 test_accuracy: 0.528\n",
            "[3,  1175] train_loss: 0.943 train_accuracy: 0.697 test_accuracy: 0.524\n",
            "[3,  1180] train_loss: 0.852 train_accuracy: 0.708 test_accuracy: 0.527\n",
            "[3,  1185] train_loss: 0.913 train_accuracy: 0.709 test_accuracy: 0.527\n",
            "[3,  1190] train_loss: 0.870 train_accuracy: 0.709 test_accuracy: 0.530\n",
            "[3,  1195] train_loss: 0.904 train_accuracy: 0.706 test_accuracy: 0.533\n",
            "[3,  1200] train_loss: 0.953 train_accuracy: 0.702 test_accuracy: 0.532\n",
            "[3,  1205] train_loss: 0.895 train_accuracy: 0.698 test_accuracy: 0.528\n",
            "[3,  1210] train_loss: 0.903 train_accuracy: 0.685 test_accuracy: 0.523\n",
            "[3,  1215] train_loss: 0.923 train_accuracy: 0.695 test_accuracy: 0.522\n",
            "[3,  1220] train_loss: 0.835 train_accuracy: 0.706 test_accuracy: 0.524\n",
            "[3,  1225] train_loss: 0.910 train_accuracy: 0.707 test_accuracy: 0.529\n",
            "[3,  1230] train_loss: 0.936 train_accuracy: 0.700 test_accuracy: 0.522\n",
            "[3,  1235] train_loss: 0.772 train_accuracy: 0.703 test_accuracy: 0.527\n",
            "[3,  1240] train_loss: 1.018 train_accuracy: 0.710 test_accuracy: 0.528\n",
            "[3,  1245] train_loss: 0.992 train_accuracy: 0.711 test_accuracy: 0.532\n",
            "[4,     5] train_loss: 0.798 train_accuracy: 0.713 test_accuracy: 0.535\n",
            "[4,    10] train_loss: 0.770 train_accuracy: 0.705 test_accuracy: 0.537\n",
            "[4,    15] train_loss: 0.675 train_accuracy: 0.699 test_accuracy: 0.536\n",
            "[4,    20] train_loss: 0.887 train_accuracy: 0.708 test_accuracy: 0.534\n",
            "[4,    25] train_loss: 0.881 train_accuracy: 0.715 test_accuracy: 0.536\n",
            "[4,    30] train_loss: 0.815 train_accuracy: 0.712 test_accuracy: 0.530\n",
            "[4,    35] train_loss: 0.958 train_accuracy: 0.709 test_accuracy: 0.525\n",
            "[4,    40] train_loss: 0.768 train_accuracy: 0.713 test_accuracy: 0.523\n",
            "[4,    45] train_loss: 0.903 train_accuracy: 0.708 test_accuracy: 0.522\n",
            "[4,    50] train_loss: 0.978 train_accuracy: 0.704 test_accuracy: 0.518\n",
            "[4,    55] train_loss: 0.834 train_accuracy: 0.705 test_accuracy: 0.523\n",
            "[4,    60] train_loss: 0.891 train_accuracy: 0.707 test_accuracy: 0.528\n",
            "[4,    65] train_loss: 0.799 train_accuracy: 0.704 test_accuracy: 0.514\n",
            "[4,    70] train_loss: 0.855 train_accuracy: 0.708 test_accuracy: 0.528\n",
            "[4,    75] train_loss: 0.842 train_accuracy: 0.706 test_accuracy: 0.524\n",
            "[4,    80] train_loss: 1.049 train_accuracy: 0.708 test_accuracy: 0.527\n",
            "[4,    85] train_loss: 0.835 train_accuracy: 0.701 test_accuracy: 0.523\n",
            "[4,    90] train_loss: 0.793 train_accuracy: 0.713 test_accuracy: 0.526\n",
            "[4,    95] train_loss: 0.857 train_accuracy: 0.714 test_accuracy: 0.528\n",
            "[4,   100] train_loss: 0.809 train_accuracy: 0.708 test_accuracy: 0.526\n",
            "[4,   105] train_loss: 0.912 train_accuracy: 0.709 test_accuracy: 0.526\n",
            "[4,   110] train_loss: 0.816 train_accuracy: 0.707 test_accuracy: 0.527\n",
            "[4,   115] train_loss: 0.943 train_accuracy: 0.710 test_accuracy: 0.531\n",
            "[4,   120] train_loss: 0.813 train_accuracy: 0.707 test_accuracy: 0.529\n",
            "[4,   125] train_loss: 0.938 train_accuracy: 0.704 test_accuracy: 0.523\n",
            "[4,   130] train_loss: 0.846 train_accuracy: 0.693 test_accuracy: 0.513\n",
            "[4,   135] train_loss: 0.900 train_accuracy: 0.696 test_accuracy: 0.519\n",
            "[4,   140] train_loss: 0.718 train_accuracy: 0.702 test_accuracy: 0.520\n",
            "[4,   145] train_loss: 0.871 train_accuracy: 0.702 test_accuracy: 0.519\n",
            "[4,   150] train_loss: 0.767 train_accuracy: 0.706 test_accuracy: 0.523\n",
            "[4,   155] train_loss: 0.870 train_accuracy: 0.703 test_accuracy: 0.531\n",
            "[4,   160] train_loss: 0.893 train_accuracy: 0.704 test_accuracy: 0.523\n",
            "[4,   165] train_loss: 0.917 train_accuracy: 0.711 test_accuracy: 0.523\n",
            "[4,   170] train_loss: 0.910 train_accuracy: 0.710 test_accuracy: 0.529\n",
            "[4,   175] train_loss: 0.777 train_accuracy: 0.703 test_accuracy: 0.529\n",
            "[4,   180] train_loss: 0.821 train_accuracy: 0.708 test_accuracy: 0.535\n",
            "[4,   185] train_loss: 0.943 train_accuracy: 0.718 test_accuracy: 0.531\n",
            "[4,   190] train_loss: 0.941 train_accuracy: 0.706 test_accuracy: 0.525\n",
            "[4,   195] train_loss: 0.882 train_accuracy: 0.684 test_accuracy: 0.512\n",
            "[4,   200] train_loss: 1.134 train_accuracy: 0.690 test_accuracy: 0.517\n",
            "[4,   205] train_loss: 0.942 train_accuracy: 0.701 test_accuracy: 0.522\n",
            "[4,   210] train_loss: 0.788 train_accuracy: 0.689 test_accuracy: 0.520\n",
            "[4,   215] train_loss: 0.907 train_accuracy: 0.701 test_accuracy: 0.525\n",
            "[4,   220] train_loss: 0.888 train_accuracy: 0.708 test_accuracy: 0.529\n",
            "[4,   225] train_loss: 0.951 train_accuracy: 0.707 test_accuracy: 0.529\n",
            "[4,   230] train_loss: 0.882 train_accuracy: 0.714 test_accuracy: 0.534\n",
            "[4,   235] train_loss: 0.793 train_accuracy: 0.710 test_accuracy: 0.535\n",
            "[4,   240] train_loss: 0.899 train_accuracy: 0.711 test_accuracy: 0.527\n",
            "[4,   245] train_loss: 0.733 train_accuracy: 0.708 test_accuracy: 0.529\n",
            "[4,   250] train_loss: 0.790 train_accuracy: 0.711 test_accuracy: 0.533\n",
            "[4,   255] train_loss: 0.863 train_accuracy: 0.706 test_accuracy: 0.530\n",
            "[4,   260] train_loss: 0.843 train_accuracy: 0.714 test_accuracy: 0.528\n",
            "[4,   265] train_loss: 0.956 train_accuracy: 0.706 test_accuracy: 0.519\n",
            "[4,   270] train_loss: 0.810 train_accuracy: 0.683 test_accuracy: 0.506\n",
            "[4,   275] train_loss: 1.223 train_accuracy: 0.691 test_accuracy: 0.510\n",
            "[4,   280] train_loss: 0.899 train_accuracy: 0.682 test_accuracy: 0.511\n",
            "[4,   285] train_loss: 0.968 train_accuracy: 0.696 test_accuracy: 0.519\n",
            "[4,   290] train_loss: 0.917 train_accuracy: 0.702 test_accuracy: 0.526\n",
            "[4,   295] train_loss: 0.899 train_accuracy: 0.694 test_accuracy: 0.518\n",
            "[4,   300] train_loss: 0.980 train_accuracy: 0.702 test_accuracy: 0.525\n",
            "[4,   305] train_loss: 0.976 train_accuracy: 0.705 test_accuracy: 0.526\n",
            "[4,   310] train_loss: 0.849 train_accuracy: 0.711 test_accuracy: 0.526\n",
            "[4,   315] train_loss: 0.902 train_accuracy: 0.717 test_accuracy: 0.533\n",
            "[4,   320] train_loss: 0.922 train_accuracy: 0.705 test_accuracy: 0.530\n",
            "[4,   325] train_loss: 0.809 train_accuracy: 0.709 test_accuracy: 0.533\n",
            "[4,   330] train_loss: 0.812 train_accuracy: 0.714 test_accuracy: 0.537\n",
            "[4,   335] train_loss: 0.905 train_accuracy: 0.710 test_accuracy: 0.534\n",
            "[4,   340] train_loss: 0.907 train_accuracy: 0.700 test_accuracy: 0.528\n",
            "[4,   345] train_loss: 0.991 train_accuracy: 0.698 test_accuracy: 0.527\n",
            "[4,   350] train_loss: 0.813 train_accuracy: 0.702 test_accuracy: 0.529\n",
            "[4,   355] train_loss: 0.878 train_accuracy: 0.713 test_accuracy: 0.534\n",
            "[4,   360] train_loss: 0.702 train_accuracy: 0.720 test_accuracy: 0.538\n",
            "[4,   365] train_loss: 0.874 train_accuracy: 0.714 test_accuracy: 0.534\n",
            "[4,   370] train_loss: 0.764 train_accuracy: 0.704 test_accuracy: 0.528\n",
            "[4,   375] train_loss: 0.966 train_accuracy: 0.706 test_accuracy: 0.532\n",
            "[4,   380] train_loss: 0.836 train_accuracy: 0.718 test_accuracy: 0.536\n",
            "[4,   385] train_loss: 0.748 train_accuracy: 0.721 test_accuracy: 0.540\n",
            "[4,   390] train_loss: 0.890 train_accuracy: 0.715 test_accuracy: 0.534\n",
            "[4,   395] train_loss: 0.829 train_accuracy: 0.703 test_accuracy: 0.529\n",
            "[4,   400] train_loss: 0.861 train_accuracy: 0.711 test_accuracy: 0.534\n",
            "[4,   405] train_loss: 0.912 train_accuracy: 0.715 test_accuracy: 0.535\n",
            "[4,   410] train_loss: 0.828 train_accuracy: 0.714 test_accuracy: 0.532\n",
            "[4,   415] train_loss: 0.821 train_accuracy: 0.703 test_accuracy: 0.529\n",
            "[4,   420] train_loss: 0.834 train_accuracy: 0.707 test_accuracy: 0.531\n",
            "[4,   425] train_loss: 0.826 train_accuracy: 0.699 test_accuracy: 0.525\n",
            "[4,   430] train_loss: 0.806 train_accuracy: 0.718 test_accuracy: 0.530\n",
            "[4,   435] train_loss: 0.922 train_accuracy: 0.722 test_accuracy: 0.538\n",
            "[4,   440] train_loss: 0.813 train_accuracy: 0.727 test_accuracy: 0.542\n",
            "[4,   445] train_loss: 0.814 train_accuracy: 0.732 test_accuracy: 0.544\n",
            "[4,   450] train_loss: 0.829 train_accuracy: 0.728 test_accuracy: 0.540\n",
            "[4,   455] train_loss: 0.860 train_accuracy: 0.721 test_accuracy: 0.536\n",
            "[4,   460] train_loss: 1.002 train_accuracy: 0.713 test_accuracy: 0.532\n",
            "[4,   465] train_loss: 0.829 train_accuracy: 0.724 test_accuracy: 0.538\n",
            "[4,   470] train_loss: 0.874 train_accuracy: 0.715 test_accuracy: 0.528\n",
            "[4,   475] train_loss: 0.920 train_accuracy: 0.720 test_accuracy: 0.530\n",
            "[4,   480] train_loss: 0.969 train_accuracy: 0.712 test_accuracy: 0.531\n",
            "[4,   485] train_loss: 0.842 train_accuracy: 0.721 test_accuracy: 0.533\n",
            "[4,   490] train_loss: 0.789 train_accuracy: 0.711 test_accuracy: 0.527\n",
            "[4,   495] train_loss: 0.857 train_accuracy: 0.705 test_accuracy: 0.523\n",
            "[4,   500] train_loss: 0.959 train_accuracy: 0.717 test_accuracy: 0.529\n",
            "[4,   505] train_loss: 0.885 train_accuracy: 0.709 test_accuracy: 0.530\n",
            "[4,   510] train_loss: 0.947 train_accuracy: 0.698 test_accuracy: 0.521\n",
            "[4,   515] train_loss: 0.895 train_accuracy: 0.712 test_accuracy: 0.528\n",
            "[4,   520] train_loss: 0.827 train_accuracy: 0.709 test_accuracy: 0.527\n",
            "[4,   525] train_loss: 0.885 train_accuracy: 0.716 test_accuracy: 0.535\n",
            "[4,   530] train_loss: 0.887 train_accuracy: 0.721 test_accuracy: 0.533\n",
            "[4,   535] train_loss: 0.847 train_accuracy: 0.717 test_accuracy: 0.532\n",
            "[4,   540] train_loss: 0.906 train_accuracy: 0.718 test_accuracy: 0.534\n",
            "[4,   545] train_loss: 0.857 train_accuracy: 0.716 test_accuracy: 0.528\n",
            "[4,   550] train_loss: 0.794 train_accuracy: 0.712 test_accuracy: 0.526\n",
            "[4,   555] train_loss: 0.904 train_accuracy: 0.706 test_accuracy: 0.526\n",
            "[4,   560] train_loss: 0.863 train_accuracy: 0.694 test_accuracy: 0.519\n",
            "[4,   565] train_loss: 1.033 train_accuracy: 0.714 test_accuracy: 0.535\n",
            "[4,   570] train_loss: 0.802 train_accuracy: 0.703 test_accuracy: 0.531\n",
            "[4,   575] train_loss: 0.820 train_accuracy: 0.695 test_accuracy: 0.525\n",
            "[4,   580] train_loss: 0.909 train_accuracy: 0.706 test_accuracy: 0.533\n",
            "[4,   585] train_loss: 0.888 train_accuracy: 0.713 test_accuracy: 0.534\n",
            "[4,   590] train_loss: 0.898 train_accuracy: 0.708 test_accuracy: 0.531\n",
            "[4,   595] train_loss: 0.990 train_accuracy: 0.706 test_accuracy: 0.531\n",
            "[4,   600] train_loss: 0.954 train_accuracy: 0.708 test_accuracy: 0.532\n",
            "[4,   605] train_loss: 0.817 train_accuracy: 0.713 test_accuracy: 0.533\n",
            "[4,   610] train_loss: 0.824 train_accuracy: 0.716 test_accuracy: 0.532\n",
            "[4,   615] train_loss: 0.939 train_accuracy: 0.726 test_accuracy: 0.539\n",
            "[4,   620] train_loss: 0.737 train_accuracy: 0.715 test_accuracy: 0.524\n",
            "[4,   625] train_loss: 0.870 train_accuracy: 0.713 test_accuracy: 0.523\n",
            "[4,   630] train_loss: 0.800 train_accuracy: 0.701 test_accuracy: 0.516\n",
            "[4,   635] train_loss: 0.937 train_accuracy: 0.715 test_accuracy: 0.521\n",
            "[4,   640] train_loss: 0.943 train_accuracy: 0.723 test_accuracy: 0.530\n",
            "[4,   645] train_loss: 0.785 train_accuracy: 0.723 test_accuracy: 0.533\n",
            "[4,   650] train_loss: 0.811 train_accuracy: 0.721 test_accuracy: 0.536\n",
            "[4,   655] train_loss: 0.925 train_accuracy: 0.718 test_accuracy: 0.537\n",
            "[4,   660] train_loss: 0.757 train_accuracy: 0.714 test_accuracy: 0.533\n",
            "[4,   665] train_loss: 0.887 train_accuracy: 0.722 test_accuracy: 0.536\n",
            "[4,   670] train_loss: 0.969 train_accuracy: 0.711 test_accuracy: 0.530\n",
            "[4,   675] train_loss: 0.860 train_accuracy: 0.708 test_accuracy: 0.526\n",
            "[4,   680] train_loss: 0.846 train_accuracy: 0.711 test_accuracy: 0.528\n",
            "[4,   685] train_loss: 0.894 train_accuracy: 0.710 test_accuracy: 0.530\n",
            "[4,   690] train_loss: 0.848 train_accuracy: 0.721 test_accuracy: 0.536\n",
            "[4,   695] train_loss: 0.839 train_accuracy: 0.716 test_accuracy: 0.532\n",
            "[4,   700] train_loss: 0.802 train_accuracy: 0.714 test_accuracy: 0.523\n",
            "[4,   705] train_loss: 0.855 train_accuracy: 0.704 test_accuracy: 0.517\n",
            "[4,   710] train_loss: 0.832 train_accuracy: 0.699 test_accuracy: 0.516\n",
            "[4,   715] train_loss: 0.928 train_accuracy: 0.713 test_accuracy: 0.523\n",
            "[4,   720] train_loss: 0.762 train_accuracy: 0.717 test_accuracy: 0.529\n",
            "[4,   725] train_loss: 0.806 train_accuracy: 0.716 test_accuracy: 0.531\n",
            "[4,   730] train_loss: 0.835 train_accuracy: 0.710 test_accuracy: 0.530\n",
            "[4,   735] train_loss: 0.869 train_accuracy: 0.709 test_accuracy: 0.528\n",
            "[4,   740] train_loss: 0.859 train_accuracy: 0.716 test_accuracy: 0.530\n",
            "[4,   745] train_loss: 1.040 train_accuracy: 0.724 test_accuracy: 0.534\n",
            "[4,   750] train_loss: 0.780 train_accuracy: 0.712 test_accuracy: 0.533\n",
            "[4,   755] train_loss: 0.851 train_accuracy: 0.720 test_accuracy: 0.539\n",
            "[4,   760] train_loss: 0.954 train_accuracy: 0.732 test_accuracy: 0.540\n",
            "[4,   765] train_loss: 0.768 train_accuracy: 0.721 test_accuracy: 0.534\n",
            "[4,   770] train_loss: 0.768 train_accuracy: 0.707 test_accuracy: 0.525\n",
            "[4,   775] train_loss: 1.007 train_accuracy: 0.720 test_accuracy: 0.533\n",
            "[4,   780] train_loss: 0.761 train_accuracy: 0.730 test_accuracy: 0.538\n",
            "[4,   785] train_loss: 0.828 train_accuracy: 0.729 test_accuracy: 0.538\n",
            "[4,   790] train_loss: 0.781 train_accuracy: 0.714 test_accuracy: 0.536\n",
            "[4,   795] train_loss: 0.855 train_accuracy: 0.707 test_accuracy: 0.531\n",
            "[4,   800] train_loss: 0.919 train_accuracy: 0.724 test_accuracy: 0.534\n",
            "[4,   805] train_loss: 0.935 train_accuracy: 0.706 test_accuracy: 0.527\n",
            "[4,   810] train_loss: 0.860 train_accuracy: 0.709 test_accuracy: 0.527\n",
            "[4,   815] train_loss: 0.796 train_accuracy: 0.711 test_accuracy: 0.530\n",
            "[4,   820] train_loss: 1.059 train_accuracy: 0.715 test_accuracy: 0.536\n",
            "[4,   825] train_loss: 0.836 train_accuracy: 0.709 test_accuracy: 0.531\n",
            "[4,   830] train_loss: 0.796 train_accuracy: 0.707 test_accuracy: 0.531\n",
            "[4,   835] train_loss: 0.893 train_accuracy: 0.715 test_accuracy: 0.532\n",
            "[4,   840] train_loss: 0.879 train_accuracy: 0.713 test_accuracy: 0.528\n",
            "[4,   845] train_loss: 0.840 train_accuracy: 0.708 test_accuracy: 0.528\n",
            "[4,   850] train_loss: 1.020 train_accuracy: 0.711 test_accuracy: 0.530\n",
            "[4,   855] train_loss: 0.995 train_accuracy: 0.711 test_accuracy: 0.525\n",
            "[4,   860] train_loss: 0.893 train_accuracy: 0.710 test_accuracy: 0.529\n",
            "[4,   865] train_loss: 0.917 train_accuracy: 0.714 test_accuracy: 0.527\n",
            "[4,   870] train_loss: 0.962 train_accuracy: 0.723 test_accuracy: 0.533\n",
            "[4,   875] train_loss: 0.776 train_accuracy: 0.719 test_accuracy: 0.533\n",
            "[4,   880] train_loss: 0.992 train_accuracy: 0.726 test_accuracy: 0.535\n",
            "[4,   885] train_loss: 0.980 train_accuracy: 0.724 test_accuracy: 0.535\n",
            "[4,   890] train_loss: 0.972 train_accuracy: 0.723 test_accuracy: 0.531\n",
            "[4,   895] train_loss: 0.894 train_accuracy: 0.726 test_accuracy: 0.533\n",
            "[4,   900] train_loss: 0.934 train_accuracy: 0.729 test_accuracy: 0.539\n",
            "[4,   905] train_loss: 0.999 train_accuracy: 0.724 test_accuracy: 0.535\n",
            "[4,   910] train_loss: 0.884 train_accuracy: 0.719 test_accuracy: 0.533\n",
            "[4,   915] train_loss: 0.894 train_accuracy: 0.708 test_accuracy: 0.528\n",
            "[4,   920] train_loss: 0.997 train_accuracy: 0.697 test_accuracy: 0.523\n",
            "[4,   925] train_loss: 0.987 train_accuracy: 0.711 test_accuracy: 0.532\n",
            "[4,   930] train_loss: 0.936 train_accuracy: 0.718 test_accuracy: 0.537\n",
            "[4,   935] train_loss: 0.956 train_accuracy: 0.712 test_accuracy: 0.530\n",
            "[4,   940] train_loss: 0.884 train_accuracy: 0.711 test_accuracy: 0.528\n",
            "[4,   945] train_loss: 0.887 train_accuracy: 0.724 test_accuracy: 0.538\n",
            "[4,   950] train_loss: 0.844 train_accuracy: 0.717 test_accuracy: 0.534\n",
            "[4,   955] train_loss: 0.956 train_accuracy: 0.717 test_accuracy: 0.533\n",
            "[4,   960] train_loss: 0.871 train_accuracy: 0.727 test_accuracy: 0.536\n",
            "[4,   965] train_loss: 0.864 train_accuracy: 0.723 test_accuracy: 0.532\n",
            "[4,   970] train_loss: 0.839 train_accuracy: 0.731 test_accuracy: 0.535\n",
            "[4,   975] train_loss: 1.001 train_accuracy: 0.717 test_accuracy: 0.530\n",
            "[4,   980] train_loss: 0.895 train_accuracy: 0.714 test_accuracy: 0.532\n",
            "[4,   985] train_loss: 0.819 train_accuracy: 0.719 test_accuracy: 0.532\n",
            "[4,   990] train_loss: 0.867 train_accuracy: 0.717 test_accuracy: 0.531\n",
            "[4,   995] train_loss: 0.822 train_accuracy: 0.718 test_accuracy: 0.528\n",
            "[4,  1000] train_loss: 0.983 train_accuracy: 0.724 test_accuracy: 0.534\n",
            "[4,  1005] train_loss: 0.882 train_accuracy: 0.718 test_accuracy: 0.534\n",
            "[4,  1010] train_loss: 0.766 train_accuracy: 0.708 test_accuracy: 0.529\n",
            "[4,  1015] train_loss: 0.804 train_accuracy: 0.708 test_accuracy: 0.532\n",
            "[4,  1020] train_loss: 1.030 train_accuracy: 0.711 test_accuracy: 0.521\n",
            "[4,  1025] train_loss: 0.832 train_accuracy: 0.701 test_accuracy: 0.519\n",
            "[4,  1030] train_loss: 0.791 train_accuracy: 0.699 test_accuracy: 0.512\n",
            "[4,  1035] train_loss: 0.831 train_accuracy: 0.708 test_accuracy: 0.520\n",
            "[4,  1040] train_loss: 0.812 train_accuracy: 0.711 test_accuracy: 0.520\n",
            "[4,  1045] train_loss: 0.789 train_accuracy: 0.715 test_accuracy: 0.531\n",
            "[4,  1050] train_loss: 0.958 train_accuracy: 0.710 test_accuracy: 0.535\n",
            "[4,  1055] train_loss: 0.749 train_accuracy: 0.710 test_accuracy: 0.533\n",
            "[4,  1060] train_loss: 0.942 train_accuracy: 0.708 test_accuracy: 0.534\n",
            "[4,  1065] train_loss: 0.908 train_accuracy: 0.721 test_accuracy: 0.541\n",
            "[4,  1070] train_loss: 0.823 train_accuracy: 0.710 test_accuracy: 0.533\n",
            "[4,  1075] train_loss: 1.011 train_accuracy: 0.718 test_accuracy: 0.536\n",
            "[4,  1080] train_loss: 0.849 train_accuracy: 0.727 test_accuracy: 0.539\n",
            "[4,  1085] train_loss: 0.788 train_accuracy: 0.724 test_accuracy: 0.539\n",
            "[4,  1090] train_loss: 0.756 train_accuracy: 0.721 test_accuracy: 0.538\n",
            "[4,  1095] train_loss: 0.852 train_accuracy: 0.725 test_accuracy: 0.539\n",
            "[4,  1100] train_loss: 0.779 train_accuracy: 0.719 test_accuracy: 0.533\n",
            "[4,  1105] train_loss: 0.960 train_accuracy: 0.717 test_accuracy: 0.531\n",
            "[4,  1110] train_loss: 0.825 train_accuracy: 0.728 test_accuracy: 0.534\n",
            "[4,  1115] train_loss: 0.769 train_accuracy: 0.720 test_accuracy: 0.533\n",
            "[4,  1120] train_loss: 1.017 train_accuracy: 0.721 test_accuracy: 0.536\n",
            "[4,  1125] train_loss: 0.862 train_accuracy: 0.726 test_accuracy: 0.533\n",
            "[4,  1130] train_loss: 0.853 train_accuracy: 0.731 test_accuracy: 0.536\n",
            "[4,  1135] train_loss: 0.785 train_accuracy: 0.726 test_accuracy: 0.538\n",
            "[4,  1140] train_loss: 0.817 train_accuracy: 0.722 test_accuracy: 0.534\n",
            "[4,  1145] train_loss: 0.875 train_accuracy: 0.723 test_accuracy: 0.539\n",
            "[4,  1150] train_loss: 0.934 train_accuracy: 0.724 test_accuracy: 0.532\n",
            "[4,  1155] train_loss: 1.035 train_accuracy: 0.708 test_accuracy: 0.525\n",
            "[4,  1160] train_loss: 0.875 train_accuracy: 0.701 test_accuracy: 0.519\n",
            "[4,  1165] train_loss: 0.905 train_accuracy: 0.687 test_accuracy: 0.511\n",
            "[4,  1170] train_loss: 0.899 train_accuracy: 0.708 test_accuracy: 0.527\n",
            "[4,  1175] train_loss: 0.849 train_accuracy: 0.706 test_accuracy: 0.530\n",
            "[4,  1180] train_loss: 0.902 train_accuracy: 0.704 test_accuracy: 0.524\n",
            "[4,  1185] train_loss: 0.938 train_accuracy: 0.710 test_accuracy: 0.521\n",
            "[4,  1190] train_loss: 0.893 train_accuracy: 0.714 test_accuracy: 0.523\n",
            "[4,  1195] train_loss: 0.830 train_accuracy: 0.730 test_accuracy: 0.532\n",
            "[4,  1200] train_loss: 0.917 train_accuracy: 0.733 test_accuracy: 0.535\n",
            "[4,  1205] train_loss: 0.827 train_accuracy: 0.727 test_accuracy: 0.532\n",
            "[4,  1210] train_loss: 0.906 train_accuracy: 0.720 test_accuracy: 0.535\n",
            "[4,  1215] train_loss: 0.914 train_accuracy: 0.731 test_accuracy: 0.542\n",
            "[4,  1220] train_loss: 0.871 train_accuracy: 0.714 test_accuracy: 0.531\n",
            "[4,  1225] train_loss: 0.970 train_accuracy: 0.694 test_accuracy: 0.518\n",
            "[4,  1230] train_loss: 0.902 train_accuracy: 0.709 test_accuracy: 0.524\n",
            "[4,  1235] train_loss: 0.940 train_accuracy: 0.695 test_accuracy: 0.517\n",
            "[4,  1240] train_loss: 0.983 train_accuracy: 0.688 test_accuracy: 0.524\n",
            "[4,  1245] train_loss: 0.932 train_accuracy: 0.715 test_accuracy: 0.534\n",
            "[5,     5] train_loss: 0.811 train_accuracy: 0.720 test_accuracy: 0.533\n",
            "[5,    10] train_loss: 0.817 train_accuracy: 0.718 test_accuracy: 0.531\n",
            "[5,    15] train_loss: 0.953 train_accuracy: 0.716 test_accuracy: 0.534\n",
            "[5,    20] train_loss: 0.937 train_accuracy: 0.718 test_accuracy: 0.536\n",
            "[5,    25] train_loss: 0.798 train_accuracy: 0.724 test_accuracy: 0.535\n",
            "[5,    30] train_loss: 0.778 train_accuracy: 0.723 test_accuracy: 0.539\n",
            "[5,    35] train_loss: 0.713 train_accuracy: 0.726 test_accuracy: 0.537\n",
            "[5,    40] train_loss: 0.722 train_accuracy: 0.728 test_accuracy: 0.539\n",
            "[5,    45] train_loss: 0.642 train_accuracy: 0.727 test_accuracy: 0.537\n",
            "[5,    50] train_loss: 0.709 train_accuracy: 0.728 test_accuracy: 0.536\n",
            "[5,    55] train_loss: 0.778 train_accuracy: 0.734 test_accuracy: 0.539\n",
            "[5,    60] train_loss: 0.762 train_accuracy: 0.733 test_accuracy: 0.542\n",
            "[5,    65] train_loss: 0.689 train_accuracy: 0.724 test_accuracy: 0.537\n",
            "[5,    70] train_loss: 0.748 train_accuracy: 0.733 test_accuracy: 0.541\n",
            "[5,    75] train_loss: 0.767 train_accuracy: 0.737 test_accuracy: 0.541\n",
            "[5,    80] train_loss: 0.831 train_accuracy: 0.728 test_accuracy: 0.539\n",
            "[5,    85] train_loss: 0.699 train_accuracy: 0.724 test_accuracy: 0.536\n",
            "[5,    90] train_loss: 0.763 train_accuracy: 0.721 test_accuracy: 0.534\n",
            "[5,    95] train_loss: 0.805 train_accuracy: 0.726 test_accuracy: 0.531\n",
            "[5,   100] train_loss: 0.761 train_accuracy: 0.722 test_accuracy: 0.537\n",
            "[5,   105] train_loss: 0.663 train_accuracy: 0.727 test_accuracy: 0.536\n",
            "[5,   110] train_loss: 0.793 train_accuracy: 0.718 test_accuracy: 0.531\n",
            "[5,   115] train_loss: 0.831 train_accuracy: 0.729 test_accuracy: 0.541\n",
            "[5,   120] train_loss: 0.856 train_accuracy: 0.723 test_accuracy: 0.539\n",
            "[5,   125] train_loss: 0.756 train_accuracy: 0.721 test_accuracy: 0.534\n",
            "[5,   130] train_loss: 0.677 train_accuracy: 0.720 test_accuracy: 0.535\n",
            "[5,   135] train_loss: 0.898 train_accuracy: 0.721 test_accuracy: 0.531\n",
            "[5,   140] train_loss: 0.884 train_accuracy: 0.716 test_accuracy: 0.529\n",
            "[5,   145] train_loss: 0.809 train_accuracy: 0.711 test_accuracy: 0.525\n",
            "[5,   150] train_loss: 0.957 train_accuracy: 0.710 test_accuracy: 0.518\n",
            "[5,   155] train_loss: 0.844 train_accuracy: 0.718 test_accuracy: 0.522\n",
            "[5,   160] train_loss: 0.793 train_accuracy: 0.708 test_accuracy: 0.519\n",
            "[5,   165] train_loss: 0.801 train_accuracy: 0.703 test_accuracy: 0.519\n",
            "[5,   170] train_loss: 0.878 train_accuracy: 0.711 test_accuracy: 0.527\n",
            "[5,   175] train_loss: 0.935 train_accuracy: 0.715 test_accuracy: 0.531\n",
            "[5,   180] train_loss: 0.822 train_accuracy: 0.718 test_accuracy: 0.530\n",
            "[5,   185] train_loss: 0.873 train_accuracy: 0.720 test_accuracy: 0.537\n",
            "[5,   190] train_loss: 0.974 train_accuracy: 0.723 test_accuracy: 0.535\n",
            "[5,   195] train_loss: 0.892 train_accuracy: 0.718 test_accuracy: 0.527\n",
            "[5,   200] train_loss: 0.891 train_accuracy: 0.720 test_accuracy: 0.525\n",
            "[5,   205] train_loss: 0.720 train_accuracy: 0.716 test_accuracy: 0.534\n",
            "[5,   210] train_loss: 0.845 train_accuracy: 0.718 test_accuracy: 0.532\n",
            "[5,   215] train_loss: 0.865 train_accuracy: 0.706 test_accuracy: 0.518\n",
            "[5,   220] train_loss: 0.862 train_accuracy: 0.709 test_accuracy: 0.520\n",
            "[5,   225] train_loss: 0.929 train_accuracy: 0.701 test_accuracy: 0.514\n",
            "[5,   230] train_loss: 0.940 train_accuracy: 0.705 test_accuracy: 0.529\n",
            "[5,   235] train_loss: 0.915 train_accuracy: 0.706 test_accuracy: 0.521\n",
            "[5,   240] train_loss: 0.922 train_accuracy: 0.700 test_accuracy: 0.513\n",
            "[5,   245] train_loss: 0.819 train_accuracy: 0.716 test_accuracy: 0.526\n",
            "[5,   250] train_loss: 0.847 train_accuracy: 0.719 test_accuracy: 0.531\n",
            "[5,   255] train_loss: 0.777 train_accuracy: 0.721 test_accuracy: 0.531\n",
            "[5,   260] train_loss: 0.820 train_accuracy: 0.720 test_accuracy: 0.534\n",
            "[5,   265] train_loss: 0.730 train_accuracy: 0.723 test_accuracy: 0.536\n",
            "[5,   270] train_loss: 0.920 train_accuracy: 0.722 test_accuracy: 0.531\n",
            "[5,   275] train_loss: 0.891 train_accuracy: 0.726 test_accuracy: 0.530\n",
            "[5,   280] train_loss: 0.851 train_accuracy: 0.729 test_accuracy: 0.530\n",
            "[5,   285] train_loss: 0.810 train_accuracy: 0.722 test_accuracy: 0.529\n",
            "[5,   290] train_loss: 0.853 train_accuracy: 0.716 test_accuracy: 0.523\n",
            "[5,   295] train_loss: 0.870 train_accuracy: 0.726 test_accuracy: 0.530\n",
            "[5,   300] train_loss: 0.773 train_accuracy: 0.717 test_accuracy: 0.523\n",
            "[5,   305] train_loss: 0.874 train_accuracy: 0.713 test_accuracy: 0.524\n",
            "[5,   310] train_loss: 0.717 train_accuracy: 0.725 test_accuracy: 0.536\n",
            "[5,   315] train_loss: 0.844 train_accuracy: 0.713 test_accuracy: 0.530\n",
            "[5,   320] train_loss: 1.020 train_accuracy: 0.723 test_accuracy: 0.530\n",
            "[5,   325] train_loss: 0.751 train_accuracy: 0.723 test_accuracy: 0.528\n",
            "[5,   330] train_loss: 0.891 train_accuracy: 0.725 test_accuracy: 0.528\n",
            "[5,   335] train_loss: 0.811 train_accuracy: 0.713 test_accuracy: 0.527\n",
            "[5,   340] train_loss: 1.007 train_accuracy: 0.719 test_accuracy: 0.530\n",
            "[5,   345] train_loss: 0.779 train_accuracy: 0.712 test_accuracy: 0.521\n",
            "[5,   350] train_loss: 0.913 train_accuracy: 0.714 test_accuracy: 0.519\n",
            "[5,   355] train_loss: 0.871 train_accuracy: 0.725 test_accuracy: 0.521\n",
            "[5,   360] train_loss: 0.936 train_accuracy: 0.722 test_accuracy: 0.525\n",
            "[5,   365] train_loss: 0.764 train_accuracy: 0.729 test_accuracy: 0.533\n",
            "[5,   370] train_loss: 0.935 train_accuracy: 0.722 test_accuracy: 0.529\n",
            "[5,   375] train_loss: 0.805 train_accuracy: 0.725 test_accuracy: 0.527\n",
            "[5,   380] train_loss: 0.750 train_accuracy: 0.733 test_accuracy: 0.536\n",
            "[5,   385] train_loss: 0.770 train_accuracy: 0.722 test_accuracy: 0.529\n",
            "[5,   390] train_loss: 0.773 train_accuracy: 0.718 test_accuracy: 0.527\n",
            "[5,   395] train_loss: 0.862 train_accuracy: 0.722 test_accuracy: 0.522\n",
            "[5,   400] train_loss: 0.898 train_accuracy: 0.716 test_accuracy: 0.518\n",
            "[5,   405] train_loss: 0.858 train_accuracy: 0.720 test_accuracy: 0.527\n",
            "[5,   410] train_loss: 0.789 train_accuracy: 0.727 test_accuracy: 0.533\n",
            "[5,   415] train_loss: 0.755 train_accuracy: 0.729 test_accuracy: 0.532\n",
            "[5,   420] train_loss: 0.816 train_accuracy: 0.726 test_accuracy: 0.538\n",
            "[5,   425] train_loss: 0.820 train_accuracy: 0.725 test_accuracy: 0.539\n",
            "[5,   430] train_loss: 0.954 train_accuracy: 0.729 test_accuracy: 0.537\n",
            "[5,   435] train_loss: 0.885 train_accuracy: 0.737 test_accuracy: 0.534\n",
            "[5,   440] train_loss: 0.673 train_accuracy: 0.728 test_accuracy: 0.530\n",
            "[5,   445] train_loss: 0.758 train_accuracy: 0.725 test_accuracy: 0.532\n",
            "[5,   450] train_loss: 0.792 train_accuracy: 0.715 test_accuracy: 0.526\n",
            "[5,   455] train_loss: 0.793 train_accuracy: 0.724 test_accuracy: 0.528\n",
            "[5,   460] train_loss: 1.001 train_accuracy: 0.721 test_accuracy: 0.530\n",
            "[5,   465] train_loss: 0.973 train_accuracy: 0.709 test_accuracy: 0.523\n",
            "[5,   470] train_loss: 0.817 train_accuracy: 0.721 test_accuracy: 0.532\n",
            "[5,   475] train_loss: 0.706 train_accuracy: 0.727 test_accuracy: 0.538\n",
            "[5,   480] train_loss: 0.809 train_accuracy: 0.726 test_accuracy: 0.541\n",
            "[5,   485] train_loss: 0.944 train_accuracy: 0.720 test_accuracy: 0.537\n",
            "[5,   490] train_loss: 0.911 train_accuracy: 0.723 test_accuracy: 0.533\n",
            "[5,   495] train_loss: 0.876 train_accuracy: 0.712 test_accuracy: 0.528\n",
            "[5,   500] train_loss: 0.844 train_accuracy: 0.719 test_accuracy: 0.528\n",
            "[5,   505] train_loss: 0.795 train_accuracy: 0.722 test_accuracy: 0.529\n",
            "[5,   510] train_loss: 0.840 train_accuracy: 0.714 test_accuracy: 0.528\n",
            "[5,   515] train_loss: 0.869 train_accuracy: 0.724 test_accuracy: 0.530\n",
            "[5,   520] train_loss: 0.905 train_accuracy: 0.727 test_accuracy: 0.531\n",
            "[5,   525] train_loss: 0.800 train_accuracy: 0.724 test_accuracy: 0.528\n",
            "[5,   530] train_loss: 0.934 train_accuracy: 0.730 test_accuracy: 0.533\n",
            "[5,   535] train_loss: 0.773 train_accuracy: 0.712 test_accuracy: 0.522\n",
            "[5,   540] train_loss: 0.917 train_accuracy: 0.724 test_accuracy: 0.536\n",
            "[5,   545] train_loss: 0.890 train_accuracy: 0.718 test_accuracy: 0.528\n",
            "[5,   550] train_loss: 0.703 train_accuracy: 0.721 test_accuracy: 0.530\n",
            "[5,   555] train_loss: 0.808 train_accuracy: 0.732 test_accuracy: 0.536\n",
            "[5,   560] train_loss: 0.808 train_accuracy: 0.719 test_accuracy: 0.527\n",
            "[5,   565] train_loss: 0.685 train_accuracy: 0.718 test_accuracy: 0.529\n",
            "[5,   570] train_loss: 0.806 train_accuracy: 0.727 test_accuracy: 0.537\n",
            "[5,   575] train_loss: 0.961 train_accuracy: 0.724 test_accuracy: 0.535\n",
            "[5,   580] train_loss: 0.703 train_accuracy: 0.710 test_accuracy: 0.529\n",
            "[5,   585] train_loss: 0.960 train_accuracy: 0.712 test_accuracy: 0.525\n",
            "[5,   590] train_loss: 0.981 train_accuracy: 0.723 test_accuracy: 0.526\n",
            "[5,   595] train_loss: 0.982 train_accuracy: 0.722 test_accuracy: 0.522\n",
            "[5,   600] train_loss: 0.990 train_accuracy: 0.718 test_accuracy: 0.532\n",
            "[5,   605] train_loss: 0.955 train_accuracy: 0.715 test_accuracy: 0.530\n",
            "[5,   610] train_loss: 0.751 train_accuracy: 0.725 test_accuracy: 0.530\n",
            "[5,   615] train_loss: 0.869 train_accuracy: 0.721 test_accuracy: 0.523\n",
            "[5,   620] train_loss: 0.983 train_accuracy: 0.724 test_accuracy: 0.525\n",
            "[5,   625] train_loss: 0.934 train_accuracy: 0.726 test_accuracy: 0.521\n",
            "[5,   630] train_loss: 0.731 train_accuracy: 0.715 test_accuracy: 0.517\n",
            "[5,   635] train_loss: 0.874 train_accuracy: 0.729 test_accuracy: 0.514\n",
            "[5,   640] train_loss: 0.785 train_accuracy: 0.725 test_accuracy: 0.521\n",
            "[5,   645] train_loss: 0.824 train_accuracy: 0.721 test_accuracy: 0.519\n",
            "[5,   650] train_loss: 0.855 train_accuracy: 0.734 test_accuracy: 0.526\n",
            "[5,   655] train_loss: 0.816 train_accuracy: 0.719 test_accuracy: 0.521\n",
            "[5,   660] train_loss: 1.013 train_accuracy: 0.718 test_accuracy: 0.521\n",
            "[5,   665] train_loss: 0.861 train_accuracy: 0.729 test_accuracy: 0.533\n",
            "[5,   670] train_loss: 0.894 train_accuracy: 0.738 test_accuracy: 0.534\n",
            "[5,   675] train_loss: 0.852 train_accuracy: 0.739 test_accuracy: 0.536\n",
            "[5,   680] train_loss: 0.748 train_accuracy: 0.728 test_accuracy: 0.527\n",
            "[5,   685] train_loss: 0.794 train_accuracy: 0.723 test_accuracy: 0.526\n",
            "[5,   690] train_loss: 0.762 train_accuracy: 0.732 test_accuracy: 0.534\n",
            "[5,   695] train_loss: 0.821 train_accuracy: 0.724 test_accuracy: 0.531\n",
            "[5,   700] train_loss: 0.772 train_accuracy: 0.724 test_accuracy: 0.528\n",
            "[5,   705] train_loss: 0.782 train_accuracy: 0.710 test_accuracy: 0.515\n",
            "[5,   710] train_loss: 0.794 train_accuracy: 0.730 test_accuracy: 0.528\n",
            "[5,   715] train_loss: 0.919 train_accuracy: 0.716 test_accuracy: 0.527\n",
            "[5,   720] train_loss: 0.749 train_accuracy: 0.715 test_accuracy: 0.524\n",
            "[5,   725] train_loss: 0.904 train_accuracy: 0.727 test_accuracy: 0.531\n",
            "[5,   730] train_loss: 1.021 train_accuracy: 0.724 test_accuracy: 0.524\n",
            "[5,   735] train_loss: 1.001 train_accuracy: 0.721 test_accuracy: 0.524\n",
            "[5,   740] train_loss: 0.864 train_accuracy: 0.715 test_accuracy: 0.520\n",
            "[5,   745] train_loss: 0.872 train_accuracy: 0.720 test_accuracy: 0.524\n",
            "[5,   750] train_loss: 0.894 train_accuracy: 0.736 test_accuracy: 0.531\n",
            "[5,   755] train_loss: 0.832 train_accuracy: 0.734 test_accuracy: 0.531\n",
            "[5,   760] train_loss: 0.905 train_accuracy: 0.732 test_accuracy: 0.527\n",
            "[5,   765] train_loss: 0.885 train_accuracy: 0.730 test_accuracy: 0.525\n",
            "[5,   770] train_loss: 0.844 train_accuracy: 0.733 test_accuracy: 0.533\n",
            "[5,   775] train_loss: 1.016 train_accuracy: 0.719 test_accuracy: 0.523\n",
            "[5,   780] train_loss: 0.882 train_accuracy: 0.730 test_accuracy: 0.533\n",
            "[5,   785] train_loss: 0.858 train_accuracy: 0.730 test_accuracy: 0.528\n",
            "[5,   790] train_loss: 0.912 train_accuracy: 0.728 test_accuracy: 0.524\n",
            "[5,   795] train_loss: 0.822 train_accuracy: 0.727 test_accuracy: 0.530\n",
            "[5,   800] train_loss: 0.836 train_accuracy: 0.723 test_accuracy: 0.530\n",
            "[5,   805] train_loss: 0.739 train_accuracy: 0.731 test_accuracy: 0.528\n",
            "[5,   810] train_loss: 0.751 train_accuracy: 0.729 test_accuracy: 0.527\n",
            "[5,   815] train_loss: 0.920 train_accuracy: 0.723 test_accuracy: 0.528\n",
            "[5,   820] train_loss: 0.925 train_accuracy: 0.725 test_accuracy: 0.531\n",
            "[5,   825] train_loss: 0.957 train_accuracy: 0.725 test_accuracy: 0.526\n",
            "[5,   830] train_loss: 0.918 train_accuracy: 0.726 test_accuracy: 0.520\n",
            "[5,   835] train_loss: 0.901 train_accuracy: 0.725 test_accuracy: 0.522\n",
            "[5,   840] train_loss: 0.844 train_accuracy: 0.726 test_accuracy: 0.532\n",
            "[5,   845] train_loss: 0.967 train_accuracy: 0.731 test_accuracy: 0.525\n",
            "[5,   850] train_loss: 0.833 train_accuracy: 0.722 test_accuracy: 0.525\n",
            "[5,   855] train_loss: 0.853 train_accuracy: 0.727 test_accuracy: 0.528\n",
            "[5,   860] train_loss: 0.881 train_accuracy: 0.729 test_accuracy: 0.521\n",
            "[5,   865] train_loss: 0.938 train_accuracy: 0.720 test_accuracy: 0.517\n",
            "[5,   870] train_loss: 0.828 train_accuracy: 0.729 test_accuracy: 0.526\n",
            "[5,   875] train_loss: 0.909 train_accuracy: 0.721 test_accuracy: 0.522\n",
            "[5,   880] train_loss: 0.729 train_accuracy: 0.723 test_accuracy: 0.532\n",
            "[5,   885] train_loss: 0.854 train_accuracy: 0.727 test_accuracy: 0.534\n",
            "[5,   890] train_loss: 0.826 train_accuracy: 0.728 test_accuracy: 0.533\n",
            "[5,   895] train_loss: 0.797 train_accuracy: 0.722 test_accuracy: 0.526\n",
            "[5,   900] train_loss: 0.979 train_accuracy: 0.727 test_accuracy: 0.531\n",
            "[5,   905] train_loss: 0.891 train_accuracy: 0.734 test_accuracy: 0.533\n",
            "[5,   910] train_loss: 0.728 train_accuracy: 0.728 test_accuracy: 0.528\n",
            "[5,   915] train_loss: 0.875 train_accuracy: 0.722 test_accuracy: 0.524\n",
            "[5,   920] train_loss: 0.930 train_accuracy: 0.729 test_accuracy: 0.533\n",
            "[5,   925] train_loss: 0.907 train_accuracy: 0.727 test_accuracy: 0.532\n",
            "[5,   930] train_loss: 0.865 train_accuracy: 0.724 test_accuracy: 0.525\n",
            "[5,   935] train_loss: 0.871 train_accuracy: 0.728 test_accuracy: 0.532\n",
            "[5,   940] train_loss: 0.817 train_accuracy: 0.727 test_accuracy: 0.529\n",
            "[5,   945] train_loss: 0.745 train_accuracy: 0.727 test_accuracy: 0.527\n",
            "[5,   950] train_loss: 0.804 train_accuracy: 0.722 test_accuracy: 0.525\n",
            "[5,   955] train_loss: 0.873 train_accuracy: 0.722 test_accuracy: 0.526\n",
            "[5,   960] train_loss: 0.835 train_accuracy: 0.730 test_accuracy: 0.535\n",
            "[5,   965] train_loss: 0.813 train_accuracy: 0.728 test_accuracy: 0.537\n",
            "[5,   970] train_loss: 0.823 train_accuracy: 0.720 test_accuracy: 0.533\n",
            "[5,   975] train_loss: 1.031 train_accuracy: 0.718 test_accuracy: 0.528\n",
            "[5,   980] train_loss: 0.966 train_accuracy: 0.708 test_accuracy: 0.515\n",
            "[5,   985] train_loss: 0.916 train_accuracy: 0.730 test_accuracy: 0.527\n",
            "[5,   990] train_loss: 0.731 train_accuracy: 0.727 test_accuracy: 0.534\n",
            "[5,   995] train_loss: 0.872 train_accuracy: 0.724 test_accuracy: 0.527\n",
            "[5,  1000] train_loss: 0.853 train_accuracy: 0.725 test_accuracy: 0.530\n",
            "[5,  1005] train_loss: 0.898 train_accuracy: 0.742 test_accuracy: 0.534\n",
            "[5,  1010] train_loss: 0.865 train_accuracy: 0.723 test_accuracy: 0.522\n",
            "[5,  1015] train_loss: 0.789 train_accuracy: 0.719 test_accuracy: 0.520\n",
            "[5,  1020] train_loss: 0.919 train_accuracy: 0.733 test_accuracy: 0.534\n",
            "[5,  1025] train_loss: 0.797 train_accuracy: 0.721 test_accuracy: 0.528\n",
            "[5,  1030] train_loss: 0.840 train_accuracy: 0.736 test_accuracy: 0.530\n",
            "[5,  1035] train_loss: 0.800 train_accuracy: 0.721 test_accuracy: 0.520\n",
            "[5,  1040] train_loss: 0.852 train_accuracy: 0.723 test_accuracy: 0.523\n",
            "[5,  1045] train_loss: 0.877 train_accuracy: 0.732 test_accuracy: 0.535\n",
            "[5,  1050] train_loss: 0.965 train_accuracy: 0.734 test_accuracy: 0.535\n",
            "[5,  1055] train_loss: 0.830 train_accuracy: 0.739 test_accuracy: 0.538\n",
            "[5,  1060] train_loss: 0.720 train_accuracy: 0.733 test_accuracy: 0.536\n",
            "[5,  1065] train_loss: 0.733 train_accuracy: 0.737 test_accuracy: 0.537\n",
            "[5,  1070] train_loss: 0.803 train_accuracy: 0.727 test_accuracy: 0.533\n",
            "[5,  1075] train_loss: 1.000 train_accuracy: 0.720 test_accuracy: 0.527\n",
            "[5,  1080] train_loss: 0.801 train_accuracy: 0.713 test_accuracy: 0.521\n",
            "[5,  1085] train_loss: 0.733 train_accuracy: 0.710 test_accuracy: 0.524\n",
            "[5,  1090] train_loss: 0.944 train_accuracy: 0.729 test_accuracy: 0.529\n",
            "[5,  1095] train_loss: 0.743 train_accuracy: 0.742 test_accuracy: 0.537\n",
            "[5,  1100] train_loss: 0.754 train_accuracy: 0.730 test_accuracy: 0.531\n",
            "[5,  1105] train_loss: 0.748 train_accuracy: 0.719 test_accuracy: 0.525\n",
            "[5,  1110] train_loss: 0.758 train_accuracy: 0.732 test_accuracy: 0.534\n",
            "[5,  1115] train_loss: 0.935 train_accuracy: 0.741 test_accuracy: 0.539\n",
            "[5,  1120] train_loss: 0.932 train_accuracy: 0.732 test_accuracy: 0.536\n",
            "[5,  1125] train_loss: 0.940 train_accuracy: 0.738 test_accuracy: 0.537\n",
            "[5,  1130] train_loss: 0.857 train_accuracy: 0.734 test_accuracy: 0.537\n",
            "[5,  1135] train_loss: 0.902 train_accuracy: 0.736 test_accuracy: 0.537\n",
            "[5,  1140] train_loss: 0.826 train_accuracy: 0.730 test_accuracy: 0.538\n",
            "[5,  1145] train_loss: 0.873 train_accuracy: 0.726 test_accuracy: 0.528\n",
            "[5,  1150] train_loss: 0.817 train_accuracy: 0.735 test_accuracy: 0.534\n",
            "[5,  1155] train_loss: 0.872 train_accuracy: 0.735 test_accuracy: 0.541\n",
            "[5,  1160] train_loss: 0.812 train_accuracy: 0.729 test_accuracy: 0.542\n",
            "[5,  1165] train_loss: 0.876 train_accuracy: 0.732 test_accuracy: 0.538\n",
            "[5,  1170] train_loss: 0.867 train_accuracy: 0.733 test_accuracy: 0.537\n",
            "[5,  1175] train_loss: 0.895 train_accuracy: 0.740 test_accuracy: 0.543\n",
            "[5,  1180] train_loss: 0.776 train_accuracy: 0.735 test_accuracy: 0.541\n",
            "[5,  1185] train_loss: 0.800 train_accuracy: 0.730 test_accuracy: 0.539\n",
            "[5,  1190] train_loss: 0.828 train_accuracy: 0.726 test_accuracy: 0.533\n",
            "[5,  1195] train_loss: 0.752 train_accuracy: 0.730 test_accuracy: 0.533\n",
            "[5,  1200] train_loss: 0.773 train_accuracy: 0.727 test_accuracy: 0.526\n",
            "[5,  1205] train_loss: 0.823 train_accuracy: 0.735 test_accuracy: 0.538\n",
            "[5,  1210] train_loss: 1.026 train_accuracy: 0.745 test_accuracy: 0.545\n",
            "[5,  1215] train_loss: 0.744 train_accuracy: 0.739 test_accuracy: 0.536\n",
            "[5,  1220] train_loss: 0.821 train_accuracy: 0.737 test_accuracy: 0.530\n",
            "[5,  1225] train_loss: 0.830 train_accuracy: 0.741 test_accuracy: 0.534\n",
            "[5,  1230] train_loss: 0.918 train_accuracy: 0.736 test_accuracy: 0.531\n",
            "[5,  1235] train_loss: 0.803 train_accuracy: 0.727 test_accuracy: 0.525\n",
            "[5,  1240] train_loss: 0.811 train_accuracy: 0.733 test_accuracy: 0.530\n",
            "[5,  1245] train_loss: 0.910 train_accuracy: 0.739 test_accuracy: 0.529\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "# Writing training accuracy to file\n",
        "with open('Accuracy_a_train.txt', 'w') as file:\n",
        "    for i in range(len(a_train)):\n",
        "        file.write(str(a_train[i]))\n",
        "        if i < len(a_train) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing test accuracy to file\n",
        "with open('Accuracy_a_test.txt', 'w') as file:\n",
        "    for i in range(len(a_test)):\n",
        "        file.write(str(a_test[i]))\n",
        "        if i < len(a_test) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing loss values to file\n",
        "with open('Accuracy_loss.txt', 'w') as file:\n",
        "    for i in range(len(lossaaa)):\n",
        "        file.write(str(lossaaa[i]))\n",
        "        if i < len(lossaaa) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "W9dpFrTm2tc4"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Convert tensors to lists\n",
        "Inf_list = [tensor.item() for tensor in Inf]\n",
        "Var_av_list = [tensor.item() for tensor in Var_all]\n",
        "Generalization_Ratio_list = [tensor.item() for tensor in Generalization_Ratio_]\n",
        "\n",
        "# Writing Inf_list to file\n",
        "with open('Inf_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Inf_list)):\n",
        "        file.write(str(Inf_list[i]))\n",
        "        if i < len(Inf_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Var_av_list to file\n",
        "with open('Var_all_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Var_av_list)):\n",
        "        file.write(str(Var_av_list[i]))\n",
        "        if i < len(Var_av_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Generalization_Ratio_list to file\n",
        "with open('Generalization_Ratio_list.txt', 'w') as file:\n",
        "    for i in range(len(Generalization_Ratio_list)):\n",
        "        file.write(str(Generalization_Ratio_list[i]))\n",
        "        if i < len(Generalization_Ratio_list) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "ZOcmTWKo2cK8"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import time\n",
        "import os  # Import the os module\n",
        "\n",
        "os.makedirs(os.path.join('./Models/'), exist_ok=True)  # Create the directory './Models/' if it doesn't exist\n",
        "model_path = './Models/'  # Define the model path\n",
        "\n",
        "rq = time.strftime('%Y%m%d%H%M', time.localtime(time.time()))  # Get the current time in the format 'YYYYMMDDHHMM'\n",
        "\n",
        "# Save the training results\n",
        "current_model_path = model_path + rq + \"_model.pkl\"  # Create the full path for the model file with the current timestamp\n",
        "torch.save(net, current_model_path)  # Save the model to the specified path\n",
        "print(\"Saved model file: \" + current_model_path)  # Print the path of the saved model file"
      ],
      "metadata": {
        "id": "D3dGBsxg2yRo"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Display the highest value that appears during training\n",
        "print(\"train:\", max(a_train))  # Print the highest value in the training data\n",
        "print(\"test:\", max(a_test))  # Print the highest value in the test data\n",
        "print(\"loss:\", min(lossaaa))  # Print the minimum value of the loss"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "Fl9VUwtZ2-hX",
        "outputId": "775157b1-4792-4a5b-e41c-546e26027348"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "train: 0.7451\n",
            "test: 0.5447\n",
            "loss: 0.6319445610046387\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "trainset = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "testset = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 test dataset\n",
        "trainloader = torch.utils.data.DataLoader(trainset, batch_size=50000, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "t_loader = torch.utils.data.DataLoader(testset, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "trainloader_iter = iter(trainloader)  # Create an iterator for the training DataLoader\n",
        "tl_image, tl_label = next(trainloader_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "tl_image = tl_image.cuda()  # Move training images to GPU\n",
        "tl_label = tl_label.cuda()  # Move training labels to GPU\n",
        "tl_imageoutputs = net(tl_image)  # [batch, 10]  # Get the outputs from the network for the training images\n",
        "predict_y = torch.max(tl_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy = torch.eq(predict_y, tl_label).sum().item() / tl_label.size(0)  # Calculate accuracy for the training set\n",
        "print(\"train:\", float(accuracy))  # Print the training accuracy\n",
        "\n",
        "t_data_iter = iter(t_loader)  # Create an iterator for the test DataLoader\n",
        "t_image, t_label = next(t_data_iter)  # Get the next batch of images and labels from the test DataLoader\n",
        "t_image = t_image.cuda()  # Move test images to GPU\n",
        "t_label = t_label.cuda()  # Move test labels to GPU\n",
        "t_imageoutputs = net(t_image)  # [batch, 10]  # Get the outputs from the network for the test images\n",
        "predict = torch.max(t_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy_t = torch.eq(predict, t_label).sum().item() / t_label.size(0)  # Calculate accuracy for the test set\n",
        "print(\"test:\", float(accuracy_t))  # Print the test accuracy"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "XJ1xk7UD3FSY",
        "outputId": "eb5fbaae-a24a-4cf2-80dc-61383e3aa489"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "train: 0.73598\n",
            "test: 0.5289\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### **Network2 : use linear layers and active layers (not use GDP)**"
      ],
      "metadata": {
        "id": "1nhY46erEfhp"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import argparse\n",
        "import os\n",
        "import numpy as np\n",
        "import torchvision.transforms as transforms\n",
        "from torchvision.utils import save_image\n",
        "from torch.utils.data import DataLoader\n",
        "from torchvision import datasets\n",
        "from torch.autograd import Variable\n",
        "import torch.nn as nn\n",
        "import torch\n",
        "\n",
        "class LANet(nn.Module):\n",
        "    def __init__(self):  # Initialization function\n",
        "        super(LANet, self).__init__()\n",
        "\n",
        "        self.fc1 = nn.Linear(3*32*32, 1000)  # Define the first fully connected layer\n",
        "        self.fc2 = nn.Linear(1000, 500)  # Define the second fully connected layer\n",
        "        self.fc3 = nn.Linear(500, 100)  # Define the third fully connected layer\n",
        "        self.fc4 = nn.Linear(100, 50)  # Define the fourth fully connected layer\n",
        "        self.fc5 = nn.Linear(50, 25)  # Define the fifth fully connected layer\n",
        "        self.fc6 = nn.Linear(25, 20)  # Define the sixth fully connected layer\n",
        "        self.fc7 = nn.Linear(20, 10)  # Define the seventh fully connected layer\n",
        "\n",
        "    def forward(self, x):  # Define the forward pass\n",
        "\n",
        "        x = x.view(-1, 3*32*32)  # Flatten the input tensor\n",
        "        x = F.relu(self.fc1(x))  # Apply ReLU activation after the first layer\n",
        "        x = self.fc2(x)  # Apply the second layer\n",
        "        x = F.relu(self.fc3(x))  # Apply ReLU activation after the third layer\n",
        "        x = self.fc4(x)  # Apply the fourth layer\n",
        "        x = F.relu(self.fc5(x))  # Apply ReLU activation after the fifth layer\n",
        "        x = F.relu(self.fc6(x))  # Apply ReLU activation after the sixth layer\n",
        "        x = self.fc7(x)  # Apply the seventh layer\n",
        "        return x  # Return the output\n",
        "\n",
        "loss_function = torch.nn.CrossEntropyLoss()  # Define the loss function as CrossEntropyLoss\n",
        "net = LANet()  # Instantiate the LANet model\n",
        "# If a GPU is available, run in CUDA mode\n",
        "if torch.cuda.is_available():\n",
        "    net = net.cuda()  # Move the network to the GPU\n",
        "    loss_function = loss_function.cuda()  # Move the loss function to the GPU\n",
        "optimizer_L = torch.optim.Adam(net.parameters(), lr=0.001)  # Initialize the Adam optimizer with learning rate 0.001"
      ],
      "metadata": {
        "id": "ZKCpchZJ3LbP"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import numpy as np\n",
        "import torch\n",
        "import torchvision\n",
        "import torch.nn as nn\n",
        "from matplotlib import pyplot as plt\n",
        "import random\n",
        "\n",
        "import torch.optim as optim\n",
        "import torchvision.transforms as transforms\n",
        "import time\n",
        "\n",
        "\n",
        "################################################ reload\n",
        "transform = transforms.Compose(\n",
        "    [transforms.ToTensor(),\n",
        "     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])  # Define the transformation to be applied to the images\n",
        "\n",
        "train_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "test_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)  # Load CIFAR-10 test dataset\n",
        "\n",
        "train_loader = torch.utils.data.DataLoader(train_set, batch_size=40, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "testloader = torch.utils.data.DataLoader(test_set, batch_size=40, shuffle=True, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "val_set = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 validation dataset\n",
        "val_loader = torch.utils.data.DataLoader(val_set, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for validation set\n",
        "val_data_iter = iter(val_loader)  # Create an iterator for the validation DataLoader\n",
        "val_image, val_label = next(val_data_iter)  # Get the next batch of images and labels from the validation DataLoader\n",
        "#print(val_image.shape)  # Print the shape of validation images\n",
        "\n",
        "##################\n",
        "tra_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=False, transform=transform)  # Load CIFAR-10 training dataset again\n",
        "tra_loader = torch.utils.data.DataLoader(tra_set, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for the training set\n",
        "tra_data_iter = iter(tra_loader)  # Create an iterator for the training DataLoader\n",
        "tra_image, tra_label = next(tra_data_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "\n",
        "##################\n",
        "classes = ('plane', 'car', 'bird', 'cat',  # Define the class labels\n",
        "           'deer', 'dog', 'frog', 'horse', 'ship', 'truck')\n",
        "\n",
        "optimizer = optim.Adam(net.parameters(), lr=0.001)  # Initialize the Adam optimizer with learning rate 0.001\n",
        "\n",
        "########################################################\n",
        "\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "from collections import Counter, defaultdict\n",
        "from itertools import combinations\n",
        "import random\n",
        "\n",
        "a_train = []  # To store training accuracy\n",
        "a_test = []  # To store test accuracy\n",
        "lossaaa = []  # To store loss values\n",
        "Inf = []  # To store information values\n",
        "Var_all = []  # To store all variation values\n",
        "Generalization_Ratio_ = []  # To store generalization ratios\n",
        "dicide_action = []  # To store decision actions\n",
        "loss_before = torch.tensor(30.0)  # Initial loss value\n",
        "los = torch.tensor(30.0)  # Initial loss value\n",
        "dis_before_A1 = torch.tensor(0)  # Distance before action A1\n",
        "dis_before_A2 = torch.tensor(0)  # Distance before action A2\n",
        "dis = torch.tensor(1)  # Distance increment\n",
        "per = \"N\"  # Previous iteration's action\n",
        "state_before = torch.tensor(0.0)  # Previous state value\n",
        "categrary_number = 10  # Number of categories\n",
        "tra_val_number = 2  # Training validation number\n",
        "\n",
        "for epoch in range(5):  # Loop over the dataset multiple times\n",
        "    e3412_iter = iter(e3412_loader)  # Iterator for e3412_loader\n",
        "    running_loss = 0.0  # Running loss\n",
        "    running_loss_all = 0.0  # Running loss for all\n",
        "    loss_before = Variable(loss_before, requires_grad=False)  # Make loss_before a variable\n",
        "    los = Variable(los, requires_grad=False)  # Make los a variable\n",
        "    state_before = Variable(state_before, requires_grad=False)  # Make state_before a variable\n",
        "    dis_before_A1 = Variable(dis_before_A1, requires_grad=False)  # Make dis_before_A1 a variable\n",
        "    dis_before_A2 = Variable(dis_before_A2, requires_grad=False)  # Make dis_before_A2 a variable\n",
        "    acc_A1 = Variable(dis_before_A1, requires_grad=False)  # Make acc_A1 a variable\n",
        "    acc_A2 = Variable(dis_before_A2, requires_grad=False)  # Make acc_A2 a variable\n",
        "    dis_ = Variable(dis, requires_grad=False)  # Make dis a variable\n",
        "\n",
        "    for step, (imgs, labels) in enumerate(e1234_loader):  # Iterate over the data\n",
        "        ### calculate losses\n",
        "        weight_val_probility = 1.0 / tra_val_number  # Weight for validation probability\n",
        "        labels = labels.cuda()  # Move labels to GPU\n",
        "        imgs = imgs.cuda()  # Move images to GPU\n",
        "        out_e1234 = net(imgs)  # Get output from the network\n",
        "        loss_out_e1234 = loss_function(out_e1234, labels)  # Calculate loss for e1234 (A1)\n",
        "\n",
        "        e3412_imgs, e3412_labels = next(e3412_iter)  # Get next batch from e3412_iter\n",
        "        e3412_imgs = e3412_imgs.cuda()  # Move e3412 images to GPU\n",
        "        e3412_labels = e3412_labels.cuda()  # Move e3412 labels to GPU\n",
        "        out_e3412 = net(e3412_imgs)  # Get output from the network\n",
        "        loss_out_e3412 = loss_function(out_e3412, e3412_labels)  # Calculate loss for e3412 (A3)\n",
        "\n",
        "        #################### extract\n",
        "        ## e1 ext count\n",
        "        e12_extracted_loader_image = e12_extracted_loader_image.cuda()  # Move e12 extracted images to GPU\n",
        "        e12_extracted_loader_label = e12_extracted_loader_label.cuda()  # Move e12 extracted labels to GPU\n",
        "        e12_extracted_out = net(e12_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e12_extracted = torch.max(e12_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ## e2 ext count\n",
        "        e34_extracted_loader_image = e34_extracted_loader_image.cuda()  # Move e34 extracted images to GPU\n",
        "        e34_extracted_loader_label = e34_extracted_loader_label.cuda()  # Move e34 extracted labels to GPU\n",
        "        e34_extracted_out = net(e34_extracted_loader_image).detach()  # Get detached output from the network\n",
        "        e34_extracted = torch.max(e34_extracted_out, dim=1)[1]  # Get max output indices\n",
        "\n",
        "        ########### e1 count\n",
        "        e12_s_loader_image = e12_s_loader_image.cuda()  # Move e12 sample images to GPU\n",
        "        e12_s_loader_label = e12_s_loader_label.cuda()  # Move e12 sample labels to GPU\n",
        "        e12_inform_out = net(e12_s_loader_image).detach()  # Get detached output from the network\n",
        "        e12_inform = torch.max(e12_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e12_inform = torch.chunk(e12_inform, 10)  # Split e12 inform into 10 chunks\n",
        "        split_e12_inform = list(split_e12_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e12_inform)):\n",
        "            counts_E12 = torch.bincount(split_e12_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e12 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e12[category] = counts_E12[category]  # Update counts\n",
        "            split_e12_inform[i] = counts_e12  # Store updated counts\n",
        "\n",
        "        ########### e2 count\n",
        "        e34_s_loader_image = e34_s_loader_image.cuda()  # Move e34 sample images to GPU\n",
        "        e34_s_loader_label = e34_s_loader_label.cuda()  # Move e34 sample labels to GPU\n",
        "        e34_inform_out = net(e34_s_loader_image).detach()  # Get detached output from the network\n",
        "        e34_inform = torch.max(e34_inform_out, dim=1)[1]  # Get max output indices\n",
        "        split_e34_inform = torch.chunk(e34_inform, 10)  # Split e34 inform into 10 chunks\n",
        "        split_e34_inform = list(split_e34_inform)  # Convert split into list\n",
        "\n",
        "        for i in range(len(split_e34_inform)):\n",
        "            counts_E34 = torch.bincount(split_e34_inform[i], minlength=10)  # Count occurrences\n",
        "            counts_e34 = torch.zeros(10)  # Initialize counts\n",
        "            for category in range(10):\n",
        "                counts_e34[category] = counts_E34[category]  # Update counts\n",
        "            split_e34_inform[i] = counts_e34  # Store updated counts\n",
        "\n",
        "        ##########\n",
        "        ## IN_IN_pro\n",
        "        counts_i_12 = torch.bincount(e12_inform, minlength=10)  # Count occurrences for e12 inform\n",
        "        counts_i_34 = torch.bincount(e34_inform, minlength=10)  # Count occurrences for e34 inform\n",
        "        counts_in_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_in_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_12[category] = counts_i_12[category]  # Update counts for e12\n",
        "        total_samples_in_12 = len(e12_inform)  # Total samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_in_34[category] = counts_i_34[category]  # Update counts for e34\n",
        "        total_samples_in_34 = len(e34_inform)  # Total samples in e34\n",
        "\n",
        "        min_denominator_in_12 = total_samples_in_12 * 1e-6  # Minimum denominator for e12\n",
        "        probabilities_in_12 = counts_in_12 / (total_samples_in_12 + min_denominator_in_12)  # Probabilities for e12\n",
        "        probabilities_tensor_in_12 = probabilities_in_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12\n",
        "\n",
        "        min_denominator_in_34 = total_samples_in_34 * 1e-6  # Minimum denominator for e34\n",
        "        probabilities_in_34 = counts_in_34 / (total_samples_in_34 + min_denominator_in_34)  # Probabilities for e34\n",
        "        probabilities_tensor_in_34 = probabilities_in_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34\n",
        "\n",
        "        counts_ext_12 = torch.bincount(e12_extracted, minlength=10)  # Count occurrences for e12 extracted\n",
        "        counts_ext_34 = torch.bincount(e34_extracted, minlength=10)  # Count occurrences for e34 extracted\n",
        "        counts_extra_12 = torch.zeros(10)  # Initialize counts\n",
        "        counts_extra_34 = torch.zeros(10)  # Initialize counts\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_12[category] = counts_ext_12[category]  # Update counts for e12 extracted\n",
        "        total_extracted_in_12 = len(e12_extracted)  # Total extracted samples in e12\n",
        "\n",
        "        for category in range(10):\n",
        "            counts_extra_34[category] = counts_ext_34[category]  # Update counts for e34 extracted\n",
        "        total_extracted_in_34 = len(e34_extracted)  # Total extracted samples in e34\n",
        "\n",
        "        min_denominator_ext_12 = total_extracted_in_12 * 1e-6  # Minimum denominator for e12 extracted\n",
        "        probabilities_ext_12 = counts_extra_12 / (total_extracted_in_12 + min_denominator_ext_12)  # Probabilities for e12 extracted\n",
        "        probabilities_tensor_extra_12 = probabilities_ext_12.unsqueeze(0)  # Unsqueeze probabilities tensor for e12 extracted\n",
        "\n",
        "        min_denominator_ext_34 = total_extracted_in_34 * 1e-6  # Minimum denominator for e34 extracted\n",
        "        probabilities_ext_34 = counts_extra_34 / (total_extracted_in_34 + min_denominator_ext_34)  # Probabilities for e34 extracted\n",
        "        probabilities_tensor_extra_34 = probabilities_ext_34.unsqueeze(0)  # Unsqueeze probabilities tensor for e34 extracted\n",
        "\n",
        "        ############################### Variation x ###################################\n",
        "        in_12_all = probabilities_tensor_in_12\n",
        "        in_34_all = probabilities_tensor_in_34\n",
        "        in_12_extra = probabilities_tensor_extra_12\n",
        "        in_34_extra = probabilities_tensor_extra_34\n",
        "        weight_tra_probility_all = 1.0 / 2\n",
        "        dow_all = \\\n",
        "              (in_12_all*weight_tra_probility_all + in_34_all*weight_tra_probility_all +\n",
        "              in_12_extra*weight_tra_probility_all + in_34_extra*weight_tra_probility_all + 1e-30)\n",
        "        in_1_all = (in_12_all*weight_tra_probility_all) / dow_all\n",
        "        in_2_all = (in_34_all*weight_tra_probility_all) / dow_all\n",
        "        e_1_all = (in_12_extra*weight_tra_probility_all) / dow_all\n",
        "        e_2_all = (in_34_extra*weight_tra_probility_all) / dow_all\n",
        "        in_1_all = in_1_all[0]\n",
        "        in_2_all = in_2_all[0]\n",
        "        e_1_all = e_1_all[0]\n",
        "        e_2_all = e_2_all[0]\n",
        "        d_KL_all = torch.zeros(10)\n",
        "        k_divergence_all = (in_1_all + 1e-30) * torch.log(in_1_all / (e_1_all + 1e-30) + 1e-30)\n",
        "        k_divergence_all_ = (in_1_all + 1e-30) * torch.log(in_1_all / (e_2_all + 1e-30) + 1e-30)\n",
        "        d_KL_all = torch.max(abs(k_divergence_all))\n",
        "        d_KL_all_ = torch.max(abs(k_divergence_all_))\n",
        "        Variation_all = torch.max(d_KL_all, d_KL_all_)\n",
        "        Var_all.append(Variation_all)\n",
        "\n",
        "        ############################ Information ###################################\n",
        "        all_combinations = list(combinations(range(10), 2))\n",
        "        K = categrary_number * (categrary_number - 1)\n",
        "        result_tensor = torch.zeros(len(all_combinations) * 2)  # Calculate the difference of each pair of combinations and store in result tensor\n",
        "        for c in range(10):\n",
        "            for idx, (i, j) in enumerate(all_combinations):\n",
        "                s1 = abs(((split_e12_inform[c][i]/10) + 1e-30) * torch.log((split_e12_inform[c][i]/10) / ((split_e12_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                s3 = abs(((split_e34_inform[c][i]/10) + 1e-30) * torch.log((split_e34_inform[c][i]/10) / ((split_e34_inform[c][j]/10) + 1e-30) + 1e-30))\n",
        "                min_value = torch.min(s1, s3)\n",
        "                result_tensor[idx] = min_value.item()\n",
        "                idx_ = idx + len(all_combinations)\n",
        "                s1_ = abs(((split_e12_inform[c][j]/10) + 1e-30) * torch.log((split_e12_inform[c][j]/10) / ((split_e12_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                s3_ = abs(((split_e34_inform[c][j]/10) + 1e-30) * torch.log((split_e34_inform[c][j]/10) / ((split_e34_inform[c][i]/10) + 1e-30) + 1e-30))\n",
        "                min_value_ = torch.min(s1_, s3_)\n",
        "                result_tensor[idx_] = min_value_.item()\n",
        "        Information = torch.sum(result_tensor) / K\n",
        "        Inf.append(Information)\n",
        "\n",
        "        ############################ Generalization_Ratio ###################################\n",
        "        Generalization_Ratio = Variation_all * (Information + 1.0) / Information\n",
        "        Generalization_Ratio_.append(Generalization_Ratio)\n",
        "\n",
        "        ############################ Generalization Decision Process (GDP) ###################################\n",
        "        state_now = Generalization_Ratio\n",
        "        loss_before = loss_before.cuda()\n",
        "        state_before = state_before.cuda()\n",
        "        state_dis = state_now - state_before\n",
        "        result_tensor = torch.cat((loss_out_e1234.unsqueeze(0), loss_out_e3412.unsqueeze(0)), 0)\n",
        "\n",
        "        # Because two datasets loss_out_e1234 and loss_out_e3412 are used, and there are actions A1 and A2,\n",
        "        # choose one based on the reward\n",
        "        if state_dis >= 0.0:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "        else:\n",
        "            if los > 0.0:  # Not fitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 -= dis\n",
        "                    dis_before_A2 += dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 += dis\n",
        "                    dis_before_A2 -= dis\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "            else:  # Overfitting\n",
        "                if per == \"A1\":\n",
        "                    dis_before_A1 += dis * 2\n",
        "                    dis_before_A2 -= dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                elif per == \"A2\":\n",
        "                    dis_before_A1 -= dis * 2\n",
        "                    dis_before_A2 += dis * 2\n",
        "                    if dis_before_A1 >= dis_before_A2:\n",
        "                        loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                        per = \"A1\"\n",
        "                    else:\n",
        "                        loss = random.choices(result_tensor, weights=[1, 3])[0]\n",
        "                        dis_before_A1 = dis_before_A1 * (1 / 4)\n",
        "                        dis_before_A2 = dis_before_A2 * (3 / 4)\n",
        "                        per = \"A2\"\n",
        "                else:\n",
        "                    loss = random.choices(result_tensor, weights=[3, 1])[0]\n",
        "                    dis_before_A1 = dis_before_A1 * (3 / 4)\n",
        "                    dis_before_A2 = dis_before_A2 * (1 / 4)\n",
        "                    per = \"A1\"\n",
        "\n",
        "        ####################################\n",
        "        #### optimizer\n",
        "        los = loss - loss_before\n",
        "        state_before = state_now\n",
        "        optimizer_L.zero_grad()\n",
        "        loss.backward()\n",
        "        optimizer_L.step()\n",
        "        loss_before = loss\n",
        "        running_loss += loss.item()\n",
        "\n",
        "        # Print statistics\n",
        "        if step % 5 == 4:  # Print every 500 mini-batches\n",
        "            with torch.no_grad():  # 'with' is a context manager\n",
        "                s_test_image = s_test_image.cuda()\n",
        "                s_test_label = s_test_label.cuda()\n",
        "                s_tra_image = s_tra_image.cuda()\n",
        "                s_tra_label = s_tra_label.cuda()\n",
        "                outputs = net(s_test_image)  # [batch, 10]\n",
        "                predict_y = torch.max(outputs, dim=1)[1]\n",
        "                accuracy = torch.eq(predict_y, s_test_label).sum().item() / s_test_label.size(0)\n",
        "                a_test.append(float(accuracy))\n",
        "                outputs_t = net(s_tra_image)  # [batch, 10]\n",
        "                predict_y_t = torch.max(outputs_t, dim=1)[1]\n",
        "                accuracy_t = torch.eq(predict_y_t, s_tra_label).sum().item() / s_tra_label.size(0)\n",
        "                a_train.append(float(accuracy_t))\n",
        "                lossaaa.append(float(running_loss / 5))\n",
        "                print('[%d, %5d] train_loss: %.3f train_accuracy: %.3f test_accuracy: %.3f' %\n",
        "                      (epoch + 1, step + 1, running_loss / 5, accuracy_t, accuracy))\n",
        "                running_loss = 0.0\n",
        "                running_loss = 0.0"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "j8oi02NhFEFu",
        "outputId": "1147cbb8-b1b5-4264-954c-d3b1ccb260ff"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "Files already downloaded and verified\n",
            "[1,     5] train_loss: 2.275 train_accuracy: 0.129 test_accuracy: 0.131\n",
            "[1,    10] train_loss: 2.233 train_accuracy: 0.181 test_accuracy: 0.180\n",
            "[1,    15] train_loss: 2.150 train_accuracy: 0.185 test_accuracy: 0.186\n",
            "[1,    20] train_loss: 2.135 train_accuracy: 0.186 test_accuracy: 0.185\n",
            "[1,    25] train_loss: 2.049 train_accuracy: 0.218 test_accuracy: 0.219\n",
            "[1,    30] train_loss: 2.099 train_accuracy: 0.194 test_accuracy: 0.199\n",
            "[1,    35] train_loss: 2.068 train_accuracy: 0.188 test_accuracy: 0.188\n",
            "[1,    40] train_loss: 2.110 train_accuracy: 0.236 test_accuracy: 0.237\n",
            "[1,    45] train_loss: 2.058 train_accuracy: 0.225 test_accuracy: 0.227\n",
            "[1,    50] train_loss: 2.098 train_accuracy: 0.246 test_accuracy: 0.248\n",
            "[1,    55] train_loss: 2.034 train_accuracy: 0.240 test_accuracy: 0.240\n",
            "[1,    60] train_loss: 2.062 train_accuracy: 0.252 test_accuracy: 0.251\n",
            "[1,    65] train_loss: 2.010 train_accuracy: 0.251 test_accuracy: 0.253\n",
            "[1,    70] train_loss: 2.125 train_accuracy: 0.225 test_accuracy: 0.226\n",
            "[1,    75] train_loss: 2.125 train_accuracy: 0.233 test_accuracy: 0.234\n",
            "[1,    80] train_loss: 1.999 train_accuracy: 0.271 test_accuracy: 0.265\n",
            "[1,    85] train_loss: 1.988 train_accuracy: 0.253 test_accuracy: 0.256\n",
            "[1,    90] train_loss: 2.045 train_accuracy: 0.278 test_accuracy: 0.283\n",
            "[1,    95] train_loss: 2.043 train_accuracy: 0.283 test_accuracy: 0.285\n",
            "[1,   100] train_loss: 1.943 train_accuracy: 0.250 test_accuracy: 0.251\n",
            "[1,   105] train_loss: 1.991 train_accuracy: 0.255 test_accuracy: 0.251\n",
            "[1,   110] train_loss: 1.930 train_accuracy: 0.260 test_accuracy: 0.256\n",
            "[1,   115] train_loss: 1.942 train_accuracy: 0.289 test_accuracy: 0.291\n",
            "[1,   120] train_loss: 1.970 train_accuracy: 0.279 test_accuracy: 0.276\n",
            "[1,   125] train_loss: 2.054 train_accuracy: 0.290 test_accuracy: 0.290\n",
            "[1,   130] train_loss: 1.974 train_accuracy: 0.297 test_accuracy: 0.296\n",
            "[1,   135] train_loss: 1.920 train_accuracy: 0.303 test_accuracy: 0.300\n",
            "[1,   140] train_loss: 1.986 train_accuracy: 0.301 test_accuracy: 0.294\n",
            "[1,   145] train_loss: 1.923 train_accuracy: 0.306 test_accuracy: 0.309\n",
            "[1,   150] train_loss: 1.846 train_accuracy: 0.295 test_accuracy: 0.293\n",
            "[1,   155] train_loss: 1.933 train_accuracy: 0.289 test_accuracy: 0.294\n",
            "[1,   160] train_loss: 2.005 train_accuracy: 0.303 test_accuracy: 0.303\n",
            "[1,   165] train_loss: 1.944 train_accuracy: 0.324 test_accuracy: 0.327\n",
            "[1,   170] train_loss: 1.953 train_accuracy: 0.314 test_accuracy: 0.312\n",
            "[1,   175] train_loss: 1.905 train_accuracy: 0.257 test_accuracy: 0.261\n",
            "[1,   180] train_loss: 1.924 train_accuracy: 0.291 test_accuracy: 0.292\n",
            "[1,   185] train_loss: 1.947 train_accuracy: 0.293 test_accuracy: 0.290\n",
            "[1,   190] train_loss: 1.948 train_accuracy: 0.297 test_accuracy: 0.298\n",
            "[1,   195] train_loss: 1.814 train_accuracy: 0.317 test_accuracy: 0.314\n",
            "[1,   200] train_loss: 1.942 train_accuracy: 0.321 test_accuracy: 0.318\n",
            "[1,   205] train_loss: 1.965 train_accuracy: 0.307 test_accuracy: 0.303\n",
            "[1,   210] train_loss: 2.042 train_accuracy: 0.309 test_accuracy: 0.308\n",
            "[1,   215] train_loss: 1.925 train_accuracy: 0.335 test_accuracy: 0.327\n",
            "[1,   220] train_loss: 1.927 train_accuracy: 0.307 test_accuracy: 0.303\n",
            "[1,   225] train_loss: 1.909 train_accuracy: 0.314 test_accuracy: 0.316\n",
            "[1,   230] train_loss: 1.972 train_accuracy: 0.306 test_accuracy: 0.302\n",
            "[1,   235] train_loss: 1.967 train_accuracy: 0.308 test_accuracy: 0.307\n",
            "[1,   240] train_loss: 1.920 train_accuracy: 0.316 test_accuracy: 0.309\n",
            "[1,   245] train_loss: 1.889 train_accuracy: 0.315 test_accuracy: 0.312\n",
            "[1,   250] train_loss: 1.958 train_accuracy: 0.330 test_accuracy: 0.321\n",
            "[1,   255] train_loss: 1.874 train_accuracy: 0.329 test_accuracy: 0.327\n",
            "[1,   260] train_loss: 1.921 train_accuracy: 0.339 test_accuracy: 0.333\n",
            "[1,   265] train_loss: 1.946 train_accuracy: 0.339 test_accuracy: 0.331\n",
            "[1,   270] train_loss: 1.827 train_accuracy: 0.338 test_accuracy: 0.337\n",
            "[1,   275] train_loss: 1.750 train_accuracy: 0.328 test_accuracy: 0.323\n",
            "[1,   280] train_loss: 1.878 train_accuracy: 0.325 test_accuracy: 0.321\n",
            "[1,   285] train_loss: 1.815 train_accuracy: 0.335 test_accuracy: 0.330\n",
            "[1,   290] train_loss: 1.827 train_accuracy: 0.327 test_accuracy: 0.326\n",
            "[1,   295] train_loss: 1.987 train_accuracy: 0.314 test_accuracy: 0.319\n",
            "[1,   300] train_loss: 1.855 train_accuracy: 0.335 test_accuracy: 0.343\n",
            "[1,   305] train_loss: 1.833 train_accuracy: 0.347 test_accuracy: 0.356\n",
            "[1,   310] train_loss: 1.826 train_accuracy: 0.346 test_accuracy: 0.342\n",
            "[1,   315] train_loss: 1.876 train_accuracy: 0.350 test_accuracy: 0.342\n",
            "[1,   320] train_loss: 1.782 train_accuracy: 0.343 test_accuracy: 0.343\n",
            "[1,   325] train_loss: 1.777 train_accuracy: 0.340 test_accuracy: 0.345\n",
            "[1,   330] train_loss: 1.801 train_accuracy: 0.345 test_accuracy: 0.348\n",
            "[1,   335] train_loss: 1.964 train_accuracy: 0.329 test_accuracy: 0.327\n",
            "[1,   340] train_loss: 1.845 train_accuracy: 0.353 test_accuracy: 0.348\n",
            "[1,   345] train_loss: 1.889 train_accuracy: 0.344 test_accuracy: 0.342\n",
            "[1,   350] train_loss: 1.792 train_accuracy: 0.346 test_accuracy: 0.343\n",
            "[1,   355] train_loss: 1.821 train_accuracy: 0.335 test_accuracy: 0.330\n",
            "[1,   360] train_loss: 1.804 train_accuracy: 0.350 test_accuracy: 0.344\n",
            "[1,   365] train_loss: 1.780 train_accuracy: 0.346 test_accuracy: 0.340\n",
            "[1,   370] train_loss: 1.895 train_accuracy: 0.331 test_accuracy: 0.329\n",
            "[1,   375] train_loss: 1.936 train_accuracy: 0.334 test_accuracy: 0.325\n",
            "[1,   380] train_loss: 1.848 train_accuracy: 0.360 test_accuracy: 0.354\n",
            "[1,   385] train_loss: 1.882 train_accuracy: 0.360 test_accuracy: 0.361\n",
            "[1,   390] train_loss: 1.817 train_accuracy: 0.362 test_accuracy: 0.365\n",
            "[1,   395] train_loss: 1.816 train_accuracy: 0.363 test_accuracy: 0.368\n",
            "[1,   400] train_loss: 1.915 train_accuracy: 0.364 test_accuracy: 0.366\n",
            "[1,   405] train_loss: 1.786 train_accuracy: 0.372 test_accuracy: 0.370\n",
            "[1,   410] train_loss: 1.722 train_accuracy: 0.357 test_accuracy: 0.353\n",
            "[1,   415] train_loss: 1.965 train_accuracy: 0.364 test_accuracy: 0.355\n",
            "[1,   420] train_loss: 1.774 train_accuracy: 0.359 test_accuracy: 0.353\n",
            "[1,   425] train_loss: 1.780 train_accuracy: 0.369 test_accuracy: 0.360\n",
            "[1,   430] train_loss: 1.857 train_accuracy: 0.364 test_accuracy: 0.358\n",
            "[1,   435] train_loss: 1.846 train_accuracy: 0.369 test_accuracy: 0.369\n",
            "[1,   440] train_loss: 1.840 train_accuracy: 0.384 test_accuracy: 0.378\n",
            "[1,   445] train_loss: 1.702 train_accuracy: 0.389 test_accuracy: 0.384\n",
            "[1,   450] train_loss: 1.870 train_accuracy: 0.377 test_accuracy: 0.378\n",
            "[1,   455] train_loss: 1.797 train_accuracy: 0.369 test_accuracy: 0.368\n",
            "[1,   460] train_loss: 1.745 train_accuracy: 0.360 test_accuracy: 0.357\n",
            "[1,   465] train_loss: 1.791 train_accuracy: 0.379 test_accuracy: 0.369\n",
            "[1,   470] train_loss: 1.759 train_accuracy: 0.378 test_accuracy: 0.370\n",
            "[1,   475] train_loss: 1.839 train_accuracy: 0.350 test_accuracy: 0.341\n",
            "[1,   480] train_loss: 1.884 train_accuracy: 0.356 test_accuracy: 0.350\n",
            "[1,   485] train_loss: 1.879 train_accuracy: 0.364 test_accuracy: 0.360\n",
            "[1,   490] train_loss: 1.729 train_accuracy: 0.376 test_accuracy: 0.377\n",
            "[1,   495] train_loss: 1.827 train_accuracy: 0.379 test_accuracy: 0.381\n",
            "[1,   500] train_loss: 1.855 train_accuracy: 0.361 test_accuracy: 0.363\n",
            "[1,   505] train_loss: 1.936 train_accuracy: 0.362 test_accuracy: 0.357\n",
            "[1,   510] train_loss: 1.764 train_accuracy: 0.369 test_accuracy: 0.372\n",
            "[1,   515] train_loss: 1.866 train_accuracy: 0.384 test_accuracy: 0.386\n",
            "[1,   520] train_loss: 1.761 train_accuracy: 0.394 test_accuracy: 0.391\n",
            "[1,   525] train_loss: 1.792 train_accuracy: 0.393 test_accuracy: 0.384\n",
            "[1,   530] train_loss: 1.874 train_accuracy: 0.379 test_accuracy: 0.377\n",
            "[1,   535] train_loss: 1.825 train_accuracy: 0.385 test_accuracy: 0.389\n",
            "[1,   540] train_loss: 1.787 train_accuracy: 0.385 test_accuracy: 0.388\n",
            "[1,   545] train_loss: 1.803 train_accuracy: 0.390 test_accuracy: 0.393\n",
            "[1,   550] train_loss: 1.650 train_accuracy: 0.362 test_accuracy: 0.355\n",
            "[1,   555] train_loss: 1.829 train_accuracy: 0.373 test_accuracy: 0.368\n",
            "[1,   560] train_loss: 1.852 train_accuracy: 0.365 test_accuracy: 0.366\n",
            "[1,   565] train_loss: 1.671 train_accuracy: 0.369 test_accuracy: 0.353\n",
            "[1,   570] train_loss: 1.746 train_accuracy: 0.376 test_accuracy: 0.362\n",
            "[1,   575] train_loss: 1.762 train_accuracy: 0.394 test_accuracy: 0.389\n",
            "[1,   580] train_loss: 1.756 train_accuracy: 0.400 test_accuracy: 0.405\n",
            "[1,   585] train_loss: 1.857 train_accuracy: 0.403 test_accuracy: 0.405\n",
            "[1,   590] train_loss: 1.830 train_accuracy: 0.388 test_accuracy: 0.387\n",
            "[1,   595] train_loss: 1.661 train_accuracy: 0.386 test_accuracy: 0.387\n",
            "[1,   600] train_loss: 1.689 train_accuracy: 0.399 test_accuracy: 0.392\n",
            "[1,   605] train_loss: 1.711 train_accuracy: 0.383 test_accuracy: 0.374\n",
            "[1,   610] train_loss: 1.769 train_accuracy: 0.379 test_accuracy: 0.379\n",
            "[1,   615] train_loss: 1.776 train_accuracy: 0.374 test_accuracy: 0.376\n",
            "[1,   620] train_loss: 1.841 train_accuracy: 0.389 test_accuracy: 0.386\n",
            "[1,   625] train_loss: 1.729 train_accuracy: 0.389 test_accuracy: 0.380\n",
            "[1,   630] train_loss: 1.805 train_accuracy: 0.395 test_accuracy: 0.386\n",
            "[1,   635] train_loss: 1.665 train_accuracy: 0.400 test_accuracy: 0.402\n",
            "[1,   640] train_loss: 1.694 train_accuracy: 0.398 test_accuracy: 0.405\n",
            "[1,   645] train_loss: 1.648 train_accuracy: 0.388 test_accuracy: 0.396\n",
            "[1,   650] train_loss: 1.789 train_accuracy: 0.376 test_accuracy: 0.380\n",
            "[1,   655] train_loss: 1.763 train_accuracy: 0.392 test_accuracy: 0.392\n",
            "[1,   660] train_loss: 1.616 train_accuracy: 0.386 test_accuracy: 0.381\n",
            "[1,   665] train_loss: 1.773 train_accuracy: 0.371 test_accuracy: 0.377\n",
            "[1,   670] train_loss: 1.738 train_accuracy: 0.388 test_accuracy: 0.392\n",
            "[1,   675] train_loss: 1.630 train_accuracy: 0.399 test_accuracy: 0.398\n",
            "[1,   680] train_loss: 1.700 train_accuracy: 0.404 test_accuracy: 0.408\n",
            "[1,   685] train_loss: 1.628 train_accuracy: 0.403 test_accuracy: 0.404\n",
            "[1,   690] train_loss: 1.677 train_accuracy: 0.385 test_accuracy: 0.397\n",
            "[1,   695] train_loss: 1.650 train_accuracy: 0.391 test_accuracy: 0.399\n",
            "[1,   700] train_loss: 1.716 train_accuracy: 0.345 test_accuracy: 0.348\n",
            "[1,   705] train_loss: 1.804 train_accuracy: 0.341 test_accuracy: 0.340\n",
            "[1,   710] train_loss: 1.781 train_accuracy: 0.341 test_accuracy: 0.342\n",
            "[1,   715] train_loss: 1.695 train_accuracy: 0.374 test_accuracy: 0.380\n",
            "[1,   720] train_loss: 1.709 train_accuracy: 0.378 test_accuracy: 0.377\n",
            "[1,   725] train_loss: 1.722 train_accuracy: 0.384 test_accuracy: 0.382\n",
            "[1,   730] train_loss: 1.800 train_accuracy: 0.397 test_accuracy: 0.400\n",
            "[1,   735] train_loss: 1.724 train_accuracy: 0.394 test_accuracy: 0.392\n",
            "[1,   740] train_loss: 1.754 train_accuracy: 0.401 test_accuracy: 0.395\n",
            "[1,   745] train_loss: 1.812 train_accuracy: 0.405 test_accuracy: 0.402\n",
            "[1,   750] train_loss: 1.689 train_accuracy: 0.391 test_accuracy: 0.397\n",
            "[1,   755] train_loss: 1.755 train_accuracy: 0.384 test_accuracy: 0.389\n",
            "[1,   760] train_loss: 1.739 train_accuracy: 0.407 test_accuracy: 0.411\n",
            "[1,   765] train_loss: 1.767 train_accuracy: 0.416 test_accuracy: 0.417\n",
            "[1,   770] train_loss: 1.600 train_accuracy: 0.405 test_accuracy: 0.402\n",
            "[1,   775] train_loss: 1.742 train_accuracy: 0.407 test_accuracy: 0.409\n",
            "[1,   780] train_loss: 1.553 train_accuracy: 0.387 test_accuracy: 0.387\n",
            "[1,   785] train_loss: 1.624 train_accuracy: 0.392 test_accuracy: 0.393\n",
            "[1,   790] train_loss: 1.677 train_accuracy: 0.381 test_accuracy: 0.382\n",
            "[1,   795] train_loss: 1.636 train_accuracy: 0.391 test_accuracy: 0.394\n",
            "[1,   800] train_loss: 1.672 train_accuracy: 0.400 test_accuracy: 0.397\n",
            "[1,   805] train_loss: 1.722 train_accuracy: 0.404 test_accuracy: 0.398\n",
            "[1,   810] train_loss: 1.690 train_accuracy: 0.414 test_accuracy: 0.399\n",
            "[1,   815] train_loss: 1.762 train_accuracy: 0.419 test_accuracy: 0.409\n",
            "[1,   820] train_loss: 1.614 train_accuracy: 0.396 test_accuracy: 0.388\n",
            "[1,   825] train_loss: 1.746 train_accuracy: 0.396 test_accuracy: 0.397\n",
            "[1,   830] train_loss: 1.610 train_accuracy: 0.390 test_accuracy: 0.387\n",
            "[1,   835] train_loss: 1.726 train_accuracy: 0.385 test_accuracy: 0.385\n",
            "[1,   840] train_loss: 1.678 train_accuracy: 0.389 test_accuracy: 0.384\n",
            "[1,   845] train_loss: 1.584 train_accuracy: 0.402 test_accuracy: 0.398\n",
            "[1,   850] train_loss: 1.843 train_accuracy: 0.409 test_accuracy: 0.406\n",
            "[1,   855] train_loss: 1.617 train_accuracy: 0.419 test_accuracy: 0.417\n",
            "[1,   860] train_loss: 1.638 train_accuracy: 0.407 test_accuracy: 0.404\n",
            "[1,   865] train_loss: 1.753 train_accuracy: 0.408 test_accuracy: 0.402\n",
            "[1,   870] train_loss: 1.577 train_accuracy: 0.409 test_accuracy: 0.403\n",
            "[1,   875] train_loss: 1.733 train_accuracy: 0.404 test_accuracy: 0.405\n",
            "[1,   880] train_loss: 1.727 train_accuracy: 0.415 test_accuracy: 0.419\n",
            "[1,   885] train_loss: 1.726 train_accuracy: 0.405 test_accuracy: 0.400\n",
            "[1,   890] train_loss: 1.677 train_accuracy: 0.398 test_accuracy: 0.398\n",
            "[1,   895] train_loss: 1.602 train_accuracy: 0.419 test_accuracy: 0.418\n",
            "[1,   900] train_loss: 1.712 train_accuracy: 0.401 test_accuracy: 0.405\n",
            "[1,   905] train_loss: 1.676 train_accuracy: 0.388 test_accuracy: 0.391\n",
            "[1,   910] train_loss: 1.730 train_accuracy: 0.400 test_accuracy: 0.405\n",
            "[1,   915] train_loss: 1.646 train_accuracy: 0.403 test_accuracy: 0.403\n",
            "[1,   920] train_loss: 1.758 train_accuracy: 0.400 test_accuracy: 0.399\n",
            "[1,   925] train_loss: 1.661 train_accuracy: 0.396 test_accuracy: 0.402\n",
            "[1,   930] train_loss: 1.656 train_accuracy: 0.400 test_accuracy: 0.404\n",
            "[1,   935] train_loss: 1.592 train_accuracy: 0.421 test_accuracy: 0.415\n",
            "[1,   940] train_loss: 1.735 train_accuracy: 0.415 test_accuracy: 0.408\n",
            "[1,   945] train_loss: 1.719 train_accuracy: 0.409 test_accuracy: 0.403\n",
            "[1,   950] train_loss: 1.727 train_accuracy: 0.421 test_accuracy: 0.417\n",
            "[1,   955] train_loss: 1.641 train_accuracy: 0.413 test_accuracy: 0.406\n",
            "[1,   960] train_loss: 1.727 train_accuracy: 0.406 test_accuracy: 0.406\n",
            "[1,   965] train_loss: 1.517 train_accuracy: 0.413 test_accuracy: 0.414\n",
            "[1,   970] train_loss: 1.771 train_accuracy: 0.401 test_accuracy: 0.400\n",
            "[1,   975] train_loss: 1.586 train_accuracy: 0.420 test_accuracy: 0.416\n",
            "[1,   980] train_loss: 1.688 train_accuracy: 0.409 test_accuracy: 0.403\n",
            "[1,   985] train_loss: 1.740 train_accuracy: 0.412 test_accuracy: 0.408\n",
            "[1,   990] train_loss: 1.670 train_accuracy: 0.417 test_accuracy: 0.409\n",
            "[1,   995] train_loss: 1.635 train_accuracy: 0.417 test_accuracy: 0.418\n",
            "[1,  1000] train_loss: 1.546 train_accuracy: 0.422 test_accuracy: 0.421\n",
            "[1,  1005] train_loss: 1.771 train_accuracy: 0.427 test_accuracy: 0.418\n",
            "[1,  1010] train_loss: 1.497 train_accuracy: 0.417 test_accuracy: 0.412\n",
            "[1,  1015] train_loss: 1.571 train_accuracy: 0.415 test_accuracy: 0.406\n",
            "[1,  1020] train_loss: 1.648 train_accuracy: 0.411 test_accuracy: 0.400\n",
            "[1,  1025] train_loss: 1.670 train_accuracy: 0.416 test_accuracy: 0.406\n",
            "[1,  1030] train_loss: 1.784 train_accuracy: 0.426 test_accuracy: 0.418\n",
            "[1,  1035] train_loss: 1.752 train_accuracy: 0.413 test_accuracy: 0.416\n",
            "[1,  1040] train_loss: 1.727 train_accuracy: 0.419 test_accuracy: 0.421\n",
            "[1,  1045] train_loss: 1.659 train_accuracy: 0.426 test_accuracy: 0.421\n",
            "[1,  1050] train_loss: 1.648 train_accuracy: 0.429 test_accuracy: 0.424\n",
            "[1,  1055] train_loss: 1.667 train_accuracy: 0.435 test_accuracy: 0.431\n",
            "[1,  1060] train_loss: 1.588 train_accuracy: 0.425 test_accuracy: 0.418\n",
            "[1,  1065] train_loss: 1.720 train_accuracy: 0.424 test_accuracy: 0.425\n",
            "[1,  1070] train_loss: 1.564 train_accuracy: 0.429 test_accuracy: 0.416\n",
            "[1,  1075] train_loss: 1.565 train_accuracy: 0.422 test_accuracy: 0.410\n",
            "[1,  1080] train_loss: 1.758 train_accuracy: 0.431 test_accuracy: 0.419\n",
            "[1,  1085] train_loss: 1.650 train_accuracy: 0.433 test_accuracy: 0.426\n",
            "[1,  1090] train_loss: 1.638 train_accuracy: 0.436 test_accuracy: 0.427\n",
            "[1,  1095] train_loss: 1.720 train_accuracy: 0.423 test_accuracy: 0.414\n",
            "[1,  1100] train_loss: 1.570 train_accuracy: 0.429 test_accuracy: 0.424\n",
            "[1,  1105] train_loss: 1.668 train_accuracy: 0.423 test_accuracy: 0.421\n",
            "[1,  1110] train_loss: 1.621 train_accuracy: 0.432 test_accuracy: 0.431\n",
            "[1,  1115] train_loss: 1.610 train_accuracy: 0.432 test_accuracy: 0.425\n",
            "[1,  1120] train_loss: 1.729 train_accuracy: 0.434 test_accuracy: 0.425\n",
            "[1,  1125] train_loss: 1.716 train_accuracy: 0.440 test_accuracy: 0.430\n",
            "[1,  1130] train_loss: 1.676 train_accuracy: 0.434 test_accuracy: 0.424\n",
            "[1,  1135] train_loss: 1.739 train_accuracy: 0.409 test_accuracy: 0.405\n",
            "[1,  1140] train_loss: 1.646 train_accuracy: 0.432 test_accuracy: 0.428\n",
            "[1,  1145] train_loss: 1.713 train_accuracy: 0.445 test_accuracy: 0.433\n",
            "[1,  1150] train_loss: 1.690 train_accuracy: 0.430 test_accuracy: 0.421\n",
            "[1,  1155] train_loss: 1.681 train_accuracy: 0.432 test_accuracy: 0.421\n",
            "[1,  1160] train_loss: 1.876 train_accuracy: 0.436 test_accuracy: 0.426\n",
            "[1,  1165] train_loss: 1.729 train_accuracy: 0.422 test_accuracy: 0.414\n",
            "[1,  1170] train_loss: 1.713 train_accuracy: 0.430 test_accuracy: 0.427\n",
            "[1,  1175] train_loss: 1.692 train_accuracy: 0.433 test_accuracy: 0.429\n",
            "[1,  1180] train_loss: 1.691 train_accuracy: 0.417 test_accuracy: 0.413\n",
            "[1,  1185] train_loss: 1.608 train_accuracy: 0.430 test_accuracy: 0.424\n",
            "[1,  1190] train_loss: 1.558 train_accuracy: 0.431 test_accuracy: 0.419\n",
            "[1,  1195] train_loss: 1.526 train_accuracy: 0.423 test_accuracy: 0.421\n",
            "[1,  1200] train_loss: 1.671 train_accuracy: 0.433 test_accuracy: 0.432\n",
            "[1,  1205] train_loss: 1.637 train_accuracy: 0.422 test_accuracy: 0.418\n",
            "[1,  1210] train_loss: 1.575 train_accuracy: 0.423 test_accuracy: 0.404\n",
            "[1,  1215] train_loss: 1.678 train_accuracy: 0.419 test_accuracy: 0.412\n",
            "[1,  1220] train_loss: 1.701 train_accuracy: 0.435 test_accuracy: 0.430\n",
            "[1,  1225] train_loss: 1.545 train_accuracy: 0.432 test_accuracy: 0.429\n",
            "[1,  1230] train_loss: 1.492 train_accuracy: 0.427 test_accuracy: 0.417\n",
            "[1,  1235] train_loss: 1.670 train_accuracy: 0.439 test_accuracy: 0.429\n",
            "[1,  1240] train_loss: 1.617 train_accuracy: 0.439 test_accuracy: 0.430\n",
            "[1,  1245] train_loss: 1.542 train_accuracy: 0.439 test_accuracy: 0.432\n",
            "[2,     5] train_loss: 1.516 train_accuracy: 0.444 test_accuracy: 0.439\n",
            "[2,    10] train_loss: 1.677 train_accuracy: 0.445 test_accuracy: 0.432\n",
            "[2,    15] train_loss: 1.602 train_accuracy: 0.431 test_accuracy: 0.419\n",
            "[2,    20] train_loss: 1.555 train_accuracy: 0.435 test_accuracy: 0.421\n",
            "[2,    25] train_loss: 1.548 train_accuracy: 0.433 test_accuracy: 0.426\n",
            "[2,    30] train_loss: 1.662 train_accuracy: 0.446 test_accuracy: 0.438\n",
            "[2,    35] train_loss: 1.792 train_accuracy: 0.443 test_accuracy: 0.435\n",
            "[2,    40] train_loss: 1.703 train_accuracy: 0.426 test_accuracy: 0.411\n",
            "[2,    45] train_loss: 1.586 train_accuracy: 0.422 test_accuracy: 0.407\n",
            "[2,    50] train_loss: 1.500 train_accuracy: 0.435 test_accuracy: 0.417\n",
            "[2,    55] train_loss: 1.543 train_accuracy: 0.441 test_accuracy: 0.427\n",
            "[2,    60] train_loss: 1.623 train_accuracy: 0.440 test_accuracy: 0.432\n",
            "[2,    65] train_loss: 1.669 train_accuracy: 0.435 test_accuracy: 0.429\n",
            "[2,    70] train_loss: 1.584 train_accuracy: 0.444 test_accuracy: 0.431\n",
            "[2,    75] train_loss: 1.635 train_accuracy: 0.453 test_accuracy: 0.442\n",
            "[2,    80] train_loss: 1.606 train_accuracy: 0.443 test_accuracy: 0.432\n",
            "[2,    85] train_loss: 1.540 train_accuracy: 0.427 test_accuracy: 0.427\n",
            "[2,    90] train_loss: 1.589 train_accuracy: 0.451 test_accuracy: 0.449\n",
            "[2,    95] train_loss: 1.633 train_accuracy: 0.448 test_accuracy: 0.440\n",
            "[2,   100] train_loss: 1.610 train_accuracy: 0.450 test_accuracy: 0.436\n",
            "[2,   105] train_loss: 1.628 train_accuracy: 0.451 test_accuracy: 0.437\n",
            "[2,   110] train_loss: 1.549 train_accuracy: 0.456 test_accuracy: 0.447\n",
            "[2,   115] train_loss: 1.620 train_accuracy: 0.455 test_accuracy: 0.447\n",
            "[2,   120] train_loss: 1.470 train_accuracy: 0.449 test_accuracy: 0.439\n",
            "[2,   125] train_loss: 1.560 train_accuracy: 0.452 test_accuracy: 0.438\n",
            "[2,   130] train_loss: 1.403 train_accuracy: 0.438 test_accuracy: 0.432\n",
            "[2,   135] train_loss: 1.586 train_accuracy: 0.427 test_accuracy: 0.415\n",
            "[2,   140] train_loss: 1.542 train_accuracy: 0.457 test_accuracy: 0.446\n",
            "[2,   145] train_loss: 1.542 train_accuracy: 0.465 test_accuracy: 0.448\n",
            "[2,   150] train_loss: 1.547 train_accuracy: 0.460 test_accuracy: 0.437\n",
            "[2,   155] train_loss: 1.450 train_accuracy: 0.447 test_accuracy: 0.432\n",
            "[2,   160] train_loss: 1.683 train_accuracy: 0.457 test_accuracy: 0.443\n",
            "[2,   165] train_loss: 1.631 train_accuracy: 0.457 test_accuracy: 0.445\n",
            "[2,   170] train_loss: 1.589 train_accuracy: 0.449 test_accuracy: 0.440\n",
            "[2,   175] train_loss: 1.538 train_accuracy: 0.448 test_accuracy: 0.437\n",
            "[2,   180] train_loss: 1.690 train_accuracy: 0.432 test_accuracy: 0.422\n",
            "[2,   185] train_loss: 1.571 train_accuracy: 0.444 test_accuracy: 0.433\n",
            "[2,   190] train_loss: 1.525 train_accuracy: 0.445 test_accuracy: 0.434\n",
            "[2,   195] train_loss: 1.595 train_accuracy: 0.445 test_accuracy: 0.433\n",
            "[2,   200] train_loss: 1.583 train_accuracy: 0.449 test_accuracy: 0.439\n",
            "[2,   205] train_loss: 1.423 train_accuracy: 0.457 test_accuracy: 0.437\n",
            "[2,   210] train_loss: 1.563 train_accuracy: 0.466 test_accuracy: 0.448\n",
            "[2,   215] train_loss: 1.530 train_accuracy: 0.465 test_accuracy: 0.448\n",
            "[2,   220] train_loss: 1.632 train_accuracy: 0.460 test_accuracy: 0.447\n",
            "[2,   225] train_loss: 1.665 train_accuracy: 0.457 test_accuracy: 0.443\n",
            "[2,   230] train_loss: 1.595 train_accuracy: 0.440 test_accuracy: 0.425\n",
            "[2,   235] train_loss: 1.699 train_accuracy: 0.436 test_accuracy: 0.430\n",
            "[2,   240] train_loss: 1.630 train_accuracy: 0.451 test_accuracy: 0.442\n",
            "[2,   245] train_loss: 1.481 train_accuracy: 0.456 test_accuracy: 0.446\n",
            "[2,   250] train_loss: 1.509 train_accuracy: 0.441 test_accuracy: 0.430\n",
            "[2,   255] train_loss: 1.769 train_accuracy: 0.448 test_accuracy: 0.441\n",
            "[2,   260] train_loss: 1.653 train_accuracy: 0.437 test_accuracy: 0.430\n",
            "[2,   265] train_loss: 1.649 train_accuracy: 0.446 test_accuracy: 0.432\n",
            "[2,   270] train_loss: 1.598 train_accuracy: 0.454 test_accuracy: 0.434\n",
            "[2,   275] train_loss: 1.619 train_accuracy: 0.464 test_accuracy: 0.448\n",
            "[2,   280] train_loss: 1.538 train_accuracy: 0.466 test_accuracy: 0.450\n",
            "[2,   285] train_loss: 1.730 train_accuracy: 0.459 test_accuracy: 0.438\n",
            "[2,   290] train_loss: 1.553 train_accuracy: 0.458 test_accuracy: 0.440\n",
            "[2,   295] train_loss: 1.655 train_accuracy: 0.462 test_accuracy: 0.444\n",
            "[2,   300] train_loss: 1.526 train_accuracy: 0.442 test_accuracy: 0.425\n",
            "[2,   305] train_loss: 1.556 train_accuracy: 0.446 test_accuracy: 0.428\n",
            "[2,   310] train_loss: 1.603 train_accuracy: 0.449 test_accuracy: 0.432\n",
            "[2,   315] train_loss: 1.530 train_accuracy: 0.463 test_accuracy: 0.444\n",
            "[2,   320] train_loss: 1.570 train_accuracy: 0.458 test_accuracy: 0.444\n",
            "[2,   325] train_loss: 1.520 train_accuracy: 0.455 test_accuracy: 0.443\n",
            "[2,   330] train_loss: 1.605 train_accuracy: 0.469 test_accuracy: 0.440\n",
            "[2,   335] train_loss: 1.667 train_accuracy: 0.469 test_accuracy: 0.440\n",
            "[2,   340] train_loss: 1.598 train_accuracy: 0.463 test_accuracy: 0.429\n",
            "[2,   345] train_loss: 1.684 train_accuracy: 0.447 test_accuracy: 0.428\n",
            "[2,   350] train_loss: 1.608 train_accuracy: 0.451 test_accuracy: 0.440\n",
            "[2,   355] train_loss: 1.486 train_accuracy: 0.445 test_accuracy: 0.437\n",
            "[2,   360] train_loss: 1.540 train_accuracy: 0.454 test_accuracy: 0.436\n",
            "[2,   365] train_loss: 1.599 train_accuracy: 0.452 test_accuracy: 0.434\n",
            "[2,   370] train_loss: 1.577 train_accuracy: 0.440 test_accuracy: 0.423\n",
            "[2,   375] train_loss: 1.616 train_accuracy: 0.448 test_accuracy: 0.425\n",
            "[2,   380] train_loss: 1.533 train_accuracy: 0.453 test_accuracy: 0.432\n",
            "[2,   385] train_loss: 1.564 train_accuracy: 0.453 test_accuracy: 0.430\n",
            "[2,   390] train_loss: 1.480 train_accuracy: 0.441 test_accuracy: 0.425\n",
            "[2,   395] train_loss: 1.629 train_accuracy: 0.459 test_accuracy: 0.446\n",
            "[2,   400] train_loss: 1.424 train_accuracy: 0.461 test_accuracy: 0.445\n",
            "[2,   405] train_loss: 1.643 train_accuracy: 0.455 test_accuracy: 0.441\n",
            "[2,   410] train_loss: 1.598 train_accuracy: 0.453 test_accuracy: 0.442\n",
            "[2,   415] train_loss: 1.770 train_accuracy: 0.457 test_accuracy: 0.440\n",
            "[2,   420] train_loss: 1.575 train_accuracy: 0.459 test_accuracy: 0.444\n",
            "[2,   425] train_loss: 1.506 train_accuracy: 0.469 test_accuracy: 0.449\n",
            "[2,   430] train_loss: 1.563 train_accuracy: 0.457 test_accuracy: 0.438\n",
            "[2,   435] train_loss: 1.485 train_accuracy: 0.461 test_accuracy: 0.447\n",
            "[2,   440] train_loss: 1.682 train_accuracy: 0.469 test_accuracy: 0.463\n",
            "[2,   445] train_loss: 1.611 train_accuracy: 0.461 test_accuracy: 0.452\n",
            "[2,   450] train_loss: 1.588 train_accuracy: 0.466 test_accuracy: 0.452\n",
            "[2,   455] train_loss: 1.585 train_accuracy: 0.467 test_accuracy: 0.454\n",
            "[2,   460] train_loss: 1.636 train_accuracy: 0.465 test_accuracy: 0.450\n",
            "[2,   465] train_loss: 1.592 train_accuracy: 0.462 test_accuracy: 0.443\n",
            "[2,   470] train_loss: 1.662 train_accuracy: 0.463 test_accuracy: 0.448\n",
            "[2,   475] train_loss: 1.693 train_accuracy: 0.455 test_accuracy: 0.441\n",
            "[2,   480] train_loss: 1.533 train_accuracy: 0.454 test_accuracy: 0.440\n",
            "[2,   485] train_loss: 1.494 train_accuracy: 0.463 test_accuracy: 0.447\n",
            "[2,   490] train_loss: 1.542 train_accuracy: 0.461 test_accuracy: 0.445\n",
            "[2,   495] train_loss: 1.466 train_accuracy: 0.463 test_accuracy: 0.447\n",
            "[2,   500] train_loss: 1.605 train_accuracy: 0.453 test_accuracy: 0.440\n",
            "[2,   505] train_loss: 1.469 train_accuracy: 0.461 test_accuracy: 0.443\n",
            "[2,   510] train_loss: 1.434 train_accuracy: 0.446 test_accuracy: 0.430\n",
            "[2,   515] train_loss: 1.581 train_accuracy: 0.470 test_accuracy: 0.455\n",
            "[2,   520] train_loss: 1.532 train_accuracy: 0.457 test_accuracy: 0.439\n",
            "[2,   525] train_loss: 1.573 train_accuracy: 0.445 test_accuracy: 0.432\n",
            "[2,   530] train_loss: 1.702 train_accuracy: 0.462 test_accuracy: 0.447\n",
            "[2,   535] train_loss: 1.426 train_accuracy: 0.452 test_accuracy: 0.443\n",
            "[2,   540] train_loss: 1.582 train_accuracy: 0.463 test_accuracy: 0.447\n",
            "[2,   545] train_loss: 1.518 train_accuracy: 0.465 test_accuracy: 0.443\n",
            "[2,   550] train_loss: 1.516 train_accuracy: 0.457 test_accuracy: 0.438\n",
            "[2,   555] train_loss: 1.498 train_accuracy: 0.476 test_accuracy: 0.456\n",
            "[2,   560] train_loss: 1.478 train_accuracy: 0.467 test_accuracy: 0.451\n",
            "[2,   565] train_loss: 1.556 train_accuracy: 0.457 test_accuracy: 0.442\n",
            "[2,   570] train_loss: 1.705 train_accuracy: 0.465 test_accuracy: 0.438\n",
            "[2,   575] train_loss: 1.709 train_accuracy: 0.457 test_accuracy: 0.434\n",
            "[2,   580] train_loss: 1.653 train_accuracy: 0.465 test_accuracy: 0.440\n",
            "[2,   585] train_loss: 1.627 train_accuracy: 0.475 test_accuracy: 0.449\n",
            "[2,   590] train_loss: 1.602 train_accuracy: 0.466 test_accuracy: 0.446\n",
            "[2,   595] train_loss: 1.506 train_accuracy: 0.456 test_accuracy: 0.440\n",
            "[2,   600] train_loss: 1.617 train_accuracy: 0.474 test_accuracy: 0.462\n",
            "[2,   605] train_loss: 1.606 train_accuracy: 0.476 test_accuracy: 0.460\n",
            "[2,   610] train_loss: 1.556 train_accuracy: 0.470 test_accuracy: 0.444\n",
            "[2,   615] train_loss: 1.490 train_accuracy: 0.473 test_accuracy: 0.447\n",
            "[2,   620] train_loss: 1.419 train_accuracy: 0.470 test_accuracy: 0.450\n",
            "[2,   625] train_loss: 1.553 train_accuracy: 0.476 test_accuracy: 0.457\n",
            "[2,   630] train_loss: 1.505 train_accuracy: 0.481 test_accuracy: 0.461\n",
            "[2,   635] train_loss: 1.381 train_accuracy: 0.457 test_accuracy: 0.435\n",
            "[2,   640] train_loss: 1.565 train_accuracy: 0.460 test_accuracy: 0.435\n",
            "[2,   645] train_loss: 1.654 train_accuracy: 0.464 test_accuracy: 0.444\n",
            "[2,   650] train_loss: 1.538 train_accuracy: 0.472 test_accuracy: 0.448\n",
            "[2,   655] train_loss: 1.541 train_accuracy: 0.473 test_accuracy: 0.450\n",
            "[2,   660] train_loss: 1.626 train_accuracy: 0.469 test_accuracy: 0.448\n",
            "[2,   665] train_loss: 1.476 train_accuracy: 0.447 test_accuracy: 0.433\n",
            "[2,   670] train_loss: 1.694 train_accuracy: 0.450 test_accuracy: 0.435\n",
            "[2,   675] train_loss: 1.691 train_accuracy: 0.462 test_accuracy: 0.443\n",
            "[2,   680] train_loss: 1.642 train_accuracy: 0.471 test_accuracy: 0.448\n",
            "[2,   685] train_loss: 1.411 train_accuracy: 0.468 test_accuracy: 0.442\n",
            "[2,   690] train_loss: 1.568 train_accuracy: 0.486 test_accuracy: 0.462\n",
            "[2,   695] train_loss: 1.613 train_accuracy: 0.468 test_accuracy: 0.450\n",
            "[2,   700] train_loss: 1.552 train_accuracy: 0.436 test_accuracy: 0.416\n",
            "[2,   705] train_loss: 1.642 train_accuracy: 0.449 test_accuracy: 0.424\n",
            "[2,   710] train_loss: 1.379 train_accuracy: 0.479 test_accuracy: 0.459\n",
            "[2,   715] train_loss: 1.420 train_accuracy: 0.473 test_accuracy: 0.456\n",
            "[2,   720] train_loss: 1.394 train_accuracy: 0.461 test_accuracy: 0.448\n",
            "[2,   725] train_loss: 1.454 train_accuracy: 0.470 test_accuracy: 0.448\n",
            "[2,   730] train_loss: 1.546 train_accuracy: 0.480 test_accuracy: 0.463\n",
            "[2,   735] train_loss: 1.561 train_accuracy: 0.461 test_accuracy: 0.444\n",
            "[2,   740] train_loss: 1.583 train_accuracy: 0.481 test_accuracy: 0.462\n",
            "[2,   745] train_loss: 1.529 train_accuracy: 0.475 test_accuracy: 0.464\n",
            "[2,   750] train_loss: 1.467 train_accuracy: 0.466 test_accuracy: 0.452\n",
            "[2,   755] train_loss: 1.499 train_accuracy: 0.470 test_accuracy: 0.451\n",
            "[2,   760] train_loss: 1.504 train_accuracy: 0.482 test_accuracy: 0.459\n",
            "[2,   765] train_loss: 1.562 train_accuracy: 0.479 test_accuracy: 0.461\n",
            "[2,   770] train_loss: 1.450 train_accuracy: 0.474 test_accuracy: 0.455\n",
            "[2,   775] train_loss: 1.568 train_accuracy: 0.468 test_accuracy: 0.453\n",
            "[2,   780] train_loss: 1.576 train_accuracy: 0.467 test_accuracy: 0.453\n",
            "[2,   785] train_loss: 1.513 train_accuracy: 0.481 test_accuracy: 0.462\n",
            "[2,   790] train_loss: 1.539 train_accuracy: 0.477 test_accuracy: 0.465\n",
            "[2,   795] train_loss: 1.554 train_accuracy: 0.470 test_accuracy: 0.455\n",
            "[2,   800] train_loss: 1.625 train_accuracy: 0.467 test_accuracy: 0.450\n",
            "[2,   805] train_loss: 1.523 train_accuracy: 0.459 test_accuracy: 0.445\n",
            "[2,   810] train_loss: 1.440 train_accuracy: 0.459 test_accuracy: 0.442\n",
            "[2,   815] train_loss: 1.497 train_accuracy: 0.460 test_accuracy: 0.440\n",
            "[2,   820] train_loss: 1.430 train_accuracy: 0.461 test_accuracy: 0.440\n",
            "[2,   825] train_loss: 1.616 train_accuracy: 0.466 test_accuracy: 0.449\n",
            "[2,   830] train_loss: 1.630 train_accuracy: 0.455 test_accuracy: 0.442\n",
            "[2,   835] train_loss: 1.684 train_accuracy: 0.468 test_accuracy: 0.447\n",
            "[2,   840] train_loss: 1.581 train_accuracy: 0.473 test_accuracy: 0.458\n",
            "[2,   845] train_loss: 1.546 train_accuracy: 0.465 test_accuracy: 0.453\n",
            "[2,   850] train_loss: 1.567 train_accuracy: 0.471 test_accuracy: 0.453\n",
            "[2,   855] train_loss: 1.497 train_accuracy: 0.469 test_accuracy: 0.456\n",
            "[2,   860] train_loss: 1.550 train_accuracy: 0.477 test_accuracy: 0.466\n",
            "[2,   865] train_loss: 1.529 train_accuracy: 0.479 test_accuracy: 0.467\n",
            "[2,   870] train_loss: 1.605 train_accuracy: 0.479 test_accuracy: 0.473\n",
            "[2,   875] train_loss: 1.434 train_accuracy: 0.473 test_accuracy: 0.463\n",
            "[2,   880] train_loss: 1.488 train_accuracy: 0.479 test_accuracy: 0.465\n",
            "[2,   885] train_loss: 1.521 train_accuracy: 0.479 test_accuracy: 0.463\n",
            "[2,   890] train_loss: 1.345 train_accuracy: 0.483 test_accuracy: 0.465\n",
            "[2,   895] train_loss: 1.754 train_accuracy: 0.474 test_accuracy: 0.454\n",
            "[2,   900] train_loss: 1.525 train_accuracy: 0.460 test_accuracy: 0.441\n",
            "[2,   905] train_loss: 1.493 train_accuracy: 0.476 test_accuracy: 0.459\n",
            "[2,   910] train_loss: 1.591 train_accuracy: 0.490 test_accuracy: 0.467\n",
            "[2,   915] train_loss: 1.517 train_accuracy: 0.488 test_accuracy: 0.462\n",
            "[2,   920] train_loss: 1.499 train_accuracy: 0.491 test_accuracy: 0.468\n",
            "[2,   925] train_loss: 1.664 train_accuracy: 0.496 test_accuracy: 0.470\n",
            "[2,   930] train_loss: 1.553 train_accuracy: 0.468 test_accuracy: 0.440\n",
            "[2,   935] train_loss: 1.632 train_accuracy: 0.485 test_accuracy: 0.466\n",
            "[2,   940] train_loss: 1.523 train_accuracy: 0.477 test_accuracy: 0.463\n",
            "[2,   945] train_loss: 1.545 train_accuracy: 0.482 test_accuracy: 0.463\n",
            "[2,   950] train_loss: 1.566 train_accuracy: 0.475 test_accuracy: 0.462\n",
            "[2,   955] train_loss: 1.567 train_accuracy: 0.459 test_accuracy: 0.449\n",
            "[2,   960] train_loss: 1.586 train_accuracy: 0.464 test_accuracy: 0.453\n",
            "[2,   965] train_loss: 1.441 train_accuracy: 0.475 test_accuracy: 0.461\n",
            "[2,   970] train_loss: 1.487 train_accuracy: 0.461 test_accuracy: 0.446\n",
            "[2,   975] train_loss: 1.543 train_accuracy: 0.469 test_accuracy: 0.459\n",
            "[2,   980] train_loss: 1.569 train_accuracy: 0.483 test_accuracy: 0.462\n",
            "[2,   985] train_loss: 1.597 train_accuracy: 0.476 test_accuracy: 0.454\n",
            "[2,   990] train_loss: 1.613 train_accuracy: 0.477 test_accuracy: 0.451\n",
            "[2,   995] train_loss: 1.573 train_accuracy: 0.477 test_accuracy: 0.461\n",
            "[2,  1000] train_loss: 1.541 train_accuracy: 0.496 test_accuracy: 0.473\n",
            "[2,  1005] train_loss: 1.574 train_accuracy: 0.495 test_accuracy: 0.474\n",
            "[2,  1010] train_loss: 1.437 train_accuracy: 0.494 test_accuracy: 0.474\n",
            "[2,  1015] train_loss: 1.558 train_accuracy: 0.486 test_accuracy: 0.465\n",
            "[2,  1020] train_loss: 1.491 train_accuracy: 0.482 test_accuracy: 0.462\n",
            "[2,  1025] train_loss: 1.450 train_accuracy: 0.482 test_accuracy: 0.457\n",
            "[2,  1030] train_loss: 1.502 train_accuracy: 0.488 test_accuracy: 0.466\n",
            "[2,  1035] train_loss: 1.516 train_accuracy: 0.484 test_accuracy: 0.461\n",
            "[2,  1040] train_loss: 1.618 train_accuracy: 0.495 test_accuracy: 0.469\n",
            "[2,  1045] train_loss: 1.532 train_accuracy: 0.487 test_accuracy: 0.459\n",
            "[2,  1050] train_loss: 1.521 train_accuracy: 0.496 test_accuracy: 0.470\n",
            "[2,  1055] train_loss: 1.490 train_accuracy: 0.485 test_accuracy: 0.458\n",
            "[2,  1060] train_loss: 1.432 train_accuracy: 0.498 test_accuracy: 0.474\n",
            "[2,  1065] train_loss: 1.671 train_accuracy: 0.485 test_accuracy: 0.468\n",
            "[2,  1070] train_loss: 1.572 train_accuracy: 0.490 test_accuracy: 0.470\n",
            "[2,  1075] train_loss: 1.436 train_accuracy: 0.491 test_accuracy: 0.468\n",
            "[2,  1080] train_loss: 1.530 train_accuracy: 0.489 test_accuracy: 0.461\n",
            "[2,  1085] train_loss: 1.536 train_accuracy: 0.478 test_accuracy: 0.461\n",
            "[2,  1090] train_loss: 1.417 train_accuracy: 0.478 test_accuracy: 0.456\n",
            "[2,  1095] train_loss: 1.588 train_accuracy: 0.482 test_accuracy: 0.466\n",
            "[2,  1100] train_loss: 1.448 train_accuracy: 0.463 test_accuracy: 0.449\n",
            "[2,  1105] train_loss: 1.692 train_accuracy: 0.471 test_accuracy: 0.454\n",
            "[2,  1110] train_loss: 1.542 train_accuracy: 0.481 test_accuracy: 0.466\n",
            "[2,  1115] train_loss: 1.491 train_accuracy: 0.478 test_accuracy: 0.453\n",
            "[2,  1120] train_loss: 1.593 train_accuracy: 0.474 test_accuracy: 0.454\n",
            "[2,  1125] train_loss: 1.635 train_accuracy: 0.485 test_accuracy: 0.466\n",
            "[2,  1130] train_loss: 1.420 train_accuracy: 0.483 test_accuracy: 0.456\n",
            "[2,  1135] train_loss: 1.598 train_accuracy: 0.477 test_accuracy: 0.448\n",
            "[2,  1140] train_loss: 1.536 train_accuracy: 0.473 test_accuracy: 0.447\n",
            "[2,  1145] train_loss: 1.768 train_accuracy: 0.479 test_accuracy: 0.453\n",
            "[2,  1150] train_loss: 1.519 train_accuracy: 0.488 test_accuracy: 0.451\n",
            "[2,  1155] train_loss: 1.584 train_accuracy: 0.467 test_accuracy: 0.441\n",
            "[2,  1160] train_loss: 1.639 train_accuracy: 0.481 test_accuracy: 0.457\n",
            "[2,  1165] train_loss: 1.631 train_accuracy: 0.495 test_accuracy: 0.479\n",
            "[2,  1170] train_loss: 1.704 train_accuracy: 0.491 test_accuracy: 0.473\n",
            "[2,  1175] train_loss: 1.426 train_accuracy: 0.492 test_accuracy: 0.468\n",
            "[2,  1180] train_loss: 1.483 train_accuracy: 0.492 test_accuracy: 0.467\n",
            "[2,  1185] train_loss: 1.594 train_accuracy: 0.486 test_accuracy: 0.463\n",
            "[2,  1190] train_loss: 1.631 train_accuracy: 0.495 test_accuracy: 0.470\n",
            "[2,  1195] train_loss: 1.471 train_accuracy: 0.491 test_accuracy: 0.464\n",
            "[2,  1200] train_loss: 1.565 train_accuracy: 0.488 test_accuracy: 0.461\n",
            "[2,  1205] train_loss: 1.417 train_accuracy: 0.486 test_accuracy: 0.461\n",
            "[2,  1210] train_loss: 1.562 train_accuracy: 0.490 test_accuracy: 0.466\n",
            "[2,  1215] train_loss: 1.528 train_accuracy: 0.477 test_accuracy: 0.455\n",
            "[2,  1220] train_loss: 1.439 train_accuracy: 0.481 test_accuracy: 0.461\n",
            "[2,  1225] train_loss: 1.594 train_accuracy: 0.486 test_accuracy: 0.466\n",
            "[2,  1230] train_loss: 1.462 train_accuracy: 0.491 test_accuracy: 0.472\n",
            "[2,  1235] train_loss: 1.562 train_accuracy: 0.487 test_accuracy: 0.468\n",
            "[2,  1240] train_loss: 1.570 train_accuracy: 0.483 test_accuracy: 0.456\n",
            "[2,  1245] train_loss: 1.531 train_accuracy: 0.484 test_accuracy: 0.457\n",
            "[3,     5] train_loss: 1.542 train_accuracy: 0.501 test_accuracy: 0.468\n",
            "[3,    10] train_loss: 1.523 train_accuracy: 0.496 test_accuracy: 0.467\n",
            "[3,    15] train_loss: 1.490 train_accuracy: 0.504 test_accuracy: 0.476\n",
            "[3,    20] train_loss: 1.376 train_accuracy: 0.506 test_accuracy: 0.469\n",
            "[3,    25] train_loss: 1.395 train_accuracy: 0.500 test_accuracy: 0.466\n",
            "[3,    30] train_loss: 1.287 train_accuracy: 0.508 test_accuracy: 0.480\n",
            "[3,    35] train_loss: 1.415 train_accuracy: 0.497 test_accuracy: 0.474\n",
            "[3,    40] train_loss: 1.512 train_accuracy: 0.489 test_accuracy: 0.469\n",
            "[3,    45] train_loss: 1.420 train_accuracy: 0.497 test_accuracy: 0.479\n",
            "[3,    50] train_loss: 1.542 train_accuracy: 0.506 test_accuracy: 0.482\n",
            "[3,    55] train_loss: 1.474 train_accuracy: 0.508 test_accuracy: 0.480\n",
            "[3,    60] train_loss: 1.323 train_accuracy: 0.495 test_accuracy: 0.465\n",
            "[3,    65] train_loss: 1.358 train_accuracy: 0.492 test_accuracy: 0.470\n",
            "[3,    70] train_loss: 1.555 train_accuracy: 0.490 test_accuracy: 0.470\n",
            "[3,    75] train_loss: 1.390 train_accuracy: 0.498 test_accuracy: 0.479\n",
            "[3,    80] train_loss: 1.407 train_accuracy: 0.494 test_accuracy: 0.468\n",
            "[3,    85] train_loss: 1.650 train_accuracy: 0.495 test_accuracy: 0.466\n",
            "[3,    90] train_loss: 1.570 train_accuracy: 0.498 test_accuracy: 0.471\n",
            "[3,    95] train_loss: 1.403 train_accuracy: 0.494 test_accuracy: 0.459\n",
            "[3,   100] train_loss: 1.399 train_accuracy: 0.508 test_accuracy: 0.467\n",
            "[3,   105] train_loss: 1.424 train_accuracy: 0.518 test_accuracy: 0.476\n",
            "[3,   110] train_loss: 1.456 train_accuracy: 0.501 test_accuracy: 0.465\n",
            "[3,   115] train_loss: 1.663 train_accuracy: 0.485 test_accuracy: 0.459\n",
            "[3,   120] train_loss: 1.567 train_accuracy: 0.472 test_accuracy: 0.448\n",
            "[3,   125] train_loss: 1.448 train_accuracy: 0.490 test_accuracy: 0.465\n",
            "[3,   130] train_loss: 1.393 train_accuracy: 0.491 test_accuracy: 0.463\n",
            "[3,   135] train_loss: 1.469 train_accuracy: 0.489 test_accuracy: 0.465\n",
            "[3,   140] train_loss: 1.388 train_accuracy: 0.497 test_accuracy: 0.471\n",
            "[3,   145] train_loss: 1.383 train_accuracy: 0.503 test_accuracy: 0.474\n",
            "[3,   150] train_loss: 1.452 train_accuracy: 0.509 test_accuracy: 0.479\n",
            "[3,   155] train_loss: 1.396 train_accuracy: 0.491 test_accuracy: 0.471\n",
            "[3,   160] train_loss: 1.602 train_accuracy: 0.487 test_accuracy: 0.464\n",
            "[3,   165] train_loss: 1.438 train_accuracy: 0.475 test_accuracy: 0.456\n",
            "[3,   170] train_loss: 1.496 train_accuracy: 0.480 test_accuracy: 0.453\n",
            "[3,   175] train_loss: 1.554 train_accuracy: 0.479 test_accuracy: 0.464\n",
            "[3,   180] train_loss: 1.527 train_accuracy: 0.473 test_accuracy: 0.452\n",
            "[3,   185] train_loss: 1.486 train_accuracy: 0.486 test_accuracy: 0.466\n",
            "[3,   190] train_loss: 1.472 train_accuracy: 0.483 test_accuracy: 0.462\n",
            "[3,   195] train_loss: 1.489 train_accuracy: 0.475 test_accuracy: 0.452\n",
            "[3,   200] train_loss: 1.583 train_accuracy: 0.487 test_accuracy: 0.466\n",
            "[3,   205] train_loss: 1.578 train_accuracy: 0.488 test_accuracy: 0.460\n",
            "[3,   210] train_loss: 1.494 train_accuracy: 0.503 test_accuracy: 0.473\n",
            "[3,   215] train_loss: 1.496 train_accuracy: 0.490 test_accuracy: 0.462\n",
            "[3,   220] train_loss: 1.539 train_accuracy: 0.501 test_accuracy: 0.472\n",
            "[3,   225] train_loss: 1.416 train_accuracy: 0.497 test_accuracy: 0.475\n",
            "[3,   230] train_loss: 1.393 train_accuracy: 0.494 test_accuracy: 0.471\n",
            "[3,   235] train_loss: 1.391 train_accuracy: 0.493 test_accuracy: 0.467\n",
            "[3,   240] train_loss: 1.541 train_accuracy: 0.503 test_accuracy: 0.472\n",
            "[3,   245] train_loss: 1.411 train_accuracy: 0.500 test_accuracy: 0.470\n",
            "[3,   250] train_loss: 1.471 train_accuracy: 0.500 test_accuracy: 0.469\n",
            "[3,   255] train_loss: 1.443 train_accuracy: 0.491 test_accuracy: 0.457\n",
            "[3,   260] train_loss: 1.429 train_accuracy: 0.493 test_accuracy: 0.459\n",
            "[3,   265] train_loss: 1.526 train_accuracy: 0.494 test_accuracy: 0.461\n",
            "[3,   270] train_loss: 1.413 train_accuracy: 0.491 test_accuracy: 0.460\n",
            "[3,   275] train_loss: 1.354 train_accuracy: 0.483 test_accuracy: 0.460\n",
            "[3,   280] train_loss: 1.466 train_accuracy: 0.492 test_accuracy: 0.472\n",
            "[3,   285] train_loss: 1.551 train_accuracy: 0.490 test_accuracy: 0.461\n",
            "[3,   290] train_loss: 1.523 train_accuracy: 0.488 test_accuracy: 0.458\n",
            "[3,   295] train_loss: 1.439 train_accuracy: 0.495 test_accuracy: 0.467\n",
            "[3,   300] train_loss: 1.473 train_accuracy: 0.505 test_accuracy: 0.476\n",
            "[3,   305] train_loss: 1.456 train_accuracy: 0.509 test_accuracy: 0.470\n",
            "[3,   310] train_loss: 1.500 train_accuracy: 0.505 test_accuracy: 0.478\n",
            "[3,   315] train_loss: 1.474 train_accuracy: 0.505 test_accuracy: 0.471\n",
            "[3,   320] train_loss: 1.407 train_accuracy: 0.493 test_accuracy: 0.463\n",
            "[3,   325] train_loss: 1.473 train_accuracy: 0.495 test_accuracy: 0.468\n",
            "[3,   330] train_loss: 1.588 train_accuracy: 0.493 test_accuracy: 0.472\n",
            "[3,   335] train_loss: 1.407 train_accuracy: 0.498 test_accuracy: 0.475\n",
            "[3,   340] train_loss: 1.303 train_accuracy: 0.507 test_accuracy: 0.480\n",
            "[3,   345] train_loss: 1.374 train_accuracy: 0.491 test_accuracy: 0.467\n",
            "[3,   350] train_loss: 1.385 train_accuracy: 0.483 test_accuracy: 0.460\n",
            "[3,   355] train_loss: 1.462 train_accuracy: 0.495 test_accuracy: 0.469\n",
            "[3,   360] train_loss: 1.414 train_accuracy: 0.495 test_accuracy: 0.469\n",
            "[3,   365] train_loss: 1.577 train_accuracy: 0.499 test_accuracy: 0.467\n",
            "[3,   370] train_loss: 1.405 train_accuracy: 0.481 test_accuracy: 0.456\n",
            "[3,   375] train_loss: 1.398 train_accuracy: 0.493 test_accuracy: 0.470\n",
            "[3,   380] train_loss: 1.370 train_accuracy: 0.494 test_accuracy: 0.473\n",
            "[3,   385] train_loss: 1.556 train_accuracy: 0.499 test_accuracy: 0.476\n",
            "[3,   390] train_loss: 1.412 train_accuracy: 0.513 test_accuracy: 0.483\n",
            "[3,   395] train_loss: 1.371 train_accuracy: 0.500 test_accuracy: 0.475\n",
            "[3,   400] train_loss: 1.526 train_accuracy: 0.507 test_accuracy: 0.477\n",
            "[3,   405] train_loss: 1.437 train_accuracy: 0.488 test_accuracy: 0.461\n",
            "[3,   410] train_loss: 1.564 train_accuracy: 0.490 test_accuracy: 0.467\n",
            "[3,   415] train_loss: 1.492 train_accuracy: 0.494 test_accuracy: 0.476\n",
            "[3,   420] train_loss: 1.368 train_accuracy: 0.499 test_accuracy: 0.485\n",
            "[3,   425] train_loss: 1.557 train_accuracy: 0.507 test_accuracy: 0.478\n",
            "[3,   430] train_loss: 1.328 train_accuracy: 0.511 test_accuracy: 0.486\n",
            "[3,   435] train_loss: 1.405 train_accuracy: 0.503 test_accuracy: 0.481\n",
            "[3,   440] train_loss: 1.443 train_accuracy: 0.498 test_accuracy: 0.476\n",
            "[3,   445] train_loss: 1.483 train_accuracy: 0.493 test_accuracy: 0.469\n",
            "[3,   450] train_loss: 1.472 train_accuracy: 0.500 test_accuracy: 0.475\n",
            "[3,   455] train_loss: 1.465 train_accuracy: 0.494 test_accuracy: 0.470\n",
            "[3,   460] train_loss: 1.575 train_accuracy: 0.504 test_accuracy: 0.476\n",
            "[3,   465] train_loss: 1.639 train_accuracy: 0.507 test_accuracy: 0.474\n",
            "[3,   470] train_loss: 1.443 train_accuracy: 0.517 test_accuracy: 0.484\n",
            "[3,   475] train_loss: 1.427 train_accuracy: 0.510 test_accuracy: 0.485\n",
            "[3,   480] train_loss: 1.469 train_accuracy: 0.511 test_accuracy: 0.489\n",
            "[3,   485] train_loss: 1.411 train_accuracy: 0.512 test_accuracy: 0.490\n",
            "[3,   490] train_loss: 1.577 train_accuracy: 0.505 test_accuracy: 0.477\n",
            "[3,   495] train_loss: 1.425 train_accuracy: 0.503 test_accuracy: 0.476\n",
            "[3,   500] train_loss: 1.441 train_accuracy: 0.499 test_accuracy: 0.479\n",
            "[3,   505] train_loss: 1.462 train_accuracy: 0.489 test_accuracy: 0.472\n",
            "[3,   510] train_loss: 1.491 train_accuracy: 0.500 test_accuracy: 0.469\n",
            "[3,   515] train_loss: 1.616 train_accuracy: 0.495 test_accuracy: 0.461\n",
            "[3,   520] train_loss: 1.457 train_accuracy: 0.499 test_accuracy: 0.460\n",
            "[3,   525] train_loss: 1.484 train_accuracy: 0.511 test_accuracy: 0.479\n",
            "[3,   530] train_loss: 1.463 train_accuracy: 0.505 test_accuracy: 0.479\n",
            "[3,   535] train_loss: 1.357 train_accuracy: 0.502 test_accuracy: 0.479\n",
            "[3,   540] train_loss: 1.489 train_accuracy: 0.507 test_accuracy: 0.485\n",
            "[3,   545] train_loss: 1.445 train_accuracy: 0.500 test_accuracy: 0.471\n",
            "[3,   550] train_loss: 1.386 train_accuracy: 0.490 test_accuracy: 0.464\n",
            "[3,   555] train_loss: 1.435 train_accuracy: 0.491 test_accuracy: 0.466\n",
            "[3,   560] train_loss: 1.492 train_accuracy: 0.499 test_accuracy: 0.476\n",
            "[3,   565] train_loss: 1.490 train_accuracy: 0.515 test_accuracy: 0.483\n",
            "[3,   570] train_loss: 1.623 train_accuracy: 0.506 test_accuracy: 0.475\n",
            "[3,   575] train_loss: 1.449 train_accuracy: 0.513 test_accuracy: 0.479\n",
            "[3,   580] train_loss: 1.458 train_accuracy: 0.495 test_accuracy: 0.467\n",
            "[3,   585] train_loss: 1.436 train_accuracy: 0.488 test_accuracy: 0.463\n",
            "[3,   590] train_loss: 1.418 train_accuracy: 0.502 test_accuracy: 0.471\n",
            "[3,   595] train_loss: 1.365 train_accuracy: 0.506 test_accuracy: 0.472\n",
            "[3,   600] train_loss: 1.549 train_accuracy: 0.519 test_accuracy: 0.486\n",
            "[3,   605] train_loss: 1.538 train_accuracy: 0.508 test_accuracy: 0.480\n",
            "[3,   610] train_loss: 1.509 train_accuracy: 0.506 test_accuracy: 0.478\n",
            "[3,   615] train_loss: 1.501 train_accuracy: 0.516 test_accuracy: 0.484\n",
            "[3,   620] train_loss: 1.443 train_accuracy: 0.509 test_accuracy: 0.486\n",
            "[3,   625] train_loss: 1.501 train_accuracy: 0.510 test_accuracy: 0.481\n",
            "[3,   630] train_loss: 1.442 train_accuracy: 0.517 test_accuracy: 0.488\n",
            "[3,   635] train_loss: 1.395 train_accuracy: 0.519 test_accuracy: 0.489\n",
            "[3,   640] train_loss: 1.461 train_accuracy: 0.513 test_accuracy: 0.485\n",
            "[3,   645] train_loss: 1.341 train_accuracy: 0.521 test_accuracy: 0.489\n",
            "[3,   650] train_loss: 1.436 train_accuracy: 0.519 test_accuracy: 0.488\n",
            "[3,   655] train_loss: 1.390 train_accuracy: 0.508 test_accuracy: 0.480\n",
            "[3,   660] train_loss: 1.537 train_accuracy: 0.524 test_accuracy: 0.486\n",
            "[3,   665] train_loss: 1.506 train_accuracy: 0.506 test_accuracy: 0.469\n",
            "[3,   670] train_loss: 1.588 train_accuracy: 0.507 test_accuracy: 0.463\n",
            "[3,   675] train_loss: 1.442 train_accuracy: 0.516 test_accuracy: 0.484\n",
            "[3,   680] train_loss: 1.402 train_accuracy: 0.507 test_accuracy: 0.483\n",
            "[3,   685] train_loss: 1.504 train_accuracy: 0.505 test_accuracy: 0.483\n",
            "[3,   690] train_loss: 1.369 train_accuracy: 0.502 test_accuracy: 0.479\n",
            "[3,   695] train_loss: 1.302 train_accuracy: 0.515 test_accuracy: 0.488\n",
            "[3,   700] train_loss: 1.449 train_accuracy: 0.513 test_accuracy: 0.481\n",
            "[3,   705] train_loss: 1.296 train_accuracy: 0.510 test_accuracy: 0.478\n",
            "[3,   710] train_loss: 1.578 train_accuracy: 0.517 test_accuracy: 0.482\n",
            "[3,   715] train_loss: 1.418 train_accuracy: 0.496 test_accuracy: 0.467\n",
            "[3,   720] train_loss: 1.544 train_accuracy: 0.506 test_accuracy: 0.471\n",
            "[3,   725] train_loss: 1.619 train_accuracy: 0.509 test_accuracy: 0.464\n",
            "[3,   730] train_loss: 1.640 train_accuracy: 0.502 test_accuracy: 0.459\n",
            "[3,   735] train_loss: 1.471 train_accuracy: 0.510 test_accuracy: 0.468\n",
            "[3,   740] train_loss: 1.501 train_accuracy: 0.511 test_accuracy: 0.473\n",
            "[3,   745] train_loss: 1.426 train_accuracy: 0.512 test_accuracy: 0.476\n",
            "[3,   750] train_loss: 1.414 train_accuracy: 0.513 test_accuracy: 0.477\n",
            "[3,   755] train_loss: 1.346 train_accuracy: 0.499 test_accuracy: 0.465\n",
            "[3,   760] train_loss: 1.331 train_accuracy: 0.490 test_accuracy: 0.460\n",
            "[3,   765] train_loss: 1.383 train_accuracy: 0.496 test_accuracy: 0.467\n",
            "[3,   770] train_loss: 1.610 train_accuracy: 0.508 test_accuracy: 0.474\n",
            "[3,   775] train_loss: 1.378 train_accuracy: 0.518 test_accuracy: 0.475\n",
            "[3,   780] train_loss: 1.362 train_accuracy: 0.513 test_accuracy: 0.475\n",
            "[3,   785] train_loss: 1.447 train_accuracy: 0.509 test_accuracy: 0.474\n",
            "[3,   790] train_loss: 1.517 train_accuracy: 0.513 test_accuracy: 0.478\n",
            "[3,   795] train_loss: 1.348 train_accuracy: 0.519 test_accuracy: 0.482\n",
            "[3,   800] train_loss: 1.441 train_accuracy: 0.516 test_accuracy: 0.475\n",
            "[3,   805] train_loss: 1.488 train_accuracy: 0.510 test_accuracy: 0.479\n",
            "[3,   810] train_loss: 1.539 train_accuracy: 0.520 test_accuracy: 0.489\n",
            "[3,   815] train_loss: 1.378 train_accuracy: 0.524 test_accuracy: 0.493\n",
            "[3,   820] train_loss: 1.401 train_accuracy: 0.513 test_accuracy: 0.481\n",
            "[3,   825] train_loss: 1.504 train_accuracy: 0.517 test_accuracy: 0.480\n",
            "[3,   830] train_loss: 1.365 train_accuracy: 0.514 test_accuracy: 0.478\n",
            "[3,   835] train_loss: 1.441 train_accuracy: 0.512 test_accuracy: 0.471\n",
            "[3,   840] train_loss: 1.518 train_accuracy: 0.510 test_accuracy: 0.466\n",
            "[3,   845] train_loss: 1.469 train_accuracy: 0.516 test_accuracy: 0.473\n",
            "[3,   850] train_loss: 1.389 train_accuracy: 0.516 test_accuracy: 0.475\n",
            "[3,   855] train_loss: 1.454 train_accuracy: 0.511 test_accuracy: 0.470\n",
            "[3,   860] train_loss: 1.519 train_accuracy: 0.524 test_accuracy: 0.482\n",
            "[3,   865] train_loss: 1.355 train_accuracy: 0.511 test_accuracy: 0.475\n",
            "[3,   870] train_loss: 1.525 train_accuracy: 0.501 test_accuracy: 0.474\n",
            "[3,   875] train_loss: 1.509 train_accuracy: 0.507 test_accuracy: 0.478\n",
            "[3,   880] train_loss: 1.436 train_accuracy: 0.512 test_accuracy: 0.477\n",
            "[3,   885] train_loss: 1.502 train_accuracy: 0.512 test_accuracy: 0.472\n",
            "[3,   890] train_loss: 1.447 train_accuracy: 0.509 test_accuracy: 0.474\n",
            "[3,   895] train_loss: 1.436 train_accuracy: 0.517 test_accuracy: 0.485\n",
            "[3,   900] train_loss: 1.390 train_accuracy: 0.510 test_accuracy: 0.474\n",
            "[3,   905] train_loss: 1.463 train_accuracy: 0.505 test_accuracy: 0.473\n",
            "[3,   910] train_loss: 1.400 train_accuracy: 0.507 test_accuracy: 0.477\n",
            "[3,   915] train_loss: 1.583 train_accuracy: 0.516 test_accuracy: 0.477\n",
            "[3,   920] train_loss: 1.443 train_accuracy: 0.530 test_accuracy: 0.491\n",
            "[3,   925] train_loss: 1.485 train_accuracy: 0.531 test_accuracy: 0.496\n",
            "[3,   930] train_loss: 1.508 train_accuracy: 0.509 test_accuracy: 0.478\n",
            "[3,   935] train_loss: 1.537 train_accuracy: 0.511 test_accuracy: 0.483\n",
            "[3,   940] train_loss: 1.518 train_accuracy: 0.513 test_accuracy: 0.484\n",
            "[3,   945] train_loss: 1.375 train_accuracy: 0.512 test_accuracy: 0.476\n",
            "[3,   950] train_loss: 1.456 train_accuracy: 0.509 test_accuracy: 0.474\n",
            "[3,   955] train_loss: 1.494 train_accuracy: 0.517 test_accuracy: 0.477\n",
            "[3,   960] train_loss: 1.316 train_accuracy: 0.517 test_accuracy: 0.480\n",
            "[3,   965] train_loss: 1.397 train_accuracy: 0.487 test_accuracy: 0.460\n",
            "[3,   970] train_loss: 1.536 train_accuracy: 0.497 test_accuracy: 0.464\n",
            "[3,   975] train_loss: 1.576 train_accuracy: 0.512 test_accuracy: 0.466\n",
            "[3,   980] train_loss: 1.362 train_accuracy: 0.507 test_accuracy: 0.463\n",
            "[3,   985] train_loss: 1.323 train_accuracy: 0.509 test_accuracy: 0.471\n",
            "[3,   990] train_loss: 1.444 train_accuracy: 0.516 test_accuracy: 0.482\n",
            "[3,   995] train_loss: 1.313 train_accuracy: 0.517 test_accuracy: 0.486\n",
            "[3,  1000] train_loss: 1.447 train_accuracy: 0.523 test_accuracy: 0.492\n",
            "[3,  1005] train_loss: 1.541 train_accuracy: 0.529 test_accuracy: 0.499\n",
            "[3,  1010] train_loss: 1.540 train_accuracy: 0.514 test_accuracy: 0.478\n",
            "[3,  1015] train_loss: 1.394 train_accuracy: 0.511 test_accuracy: 0.477\n",
            "[3,  1020] train_loss: 1.434 train_accuracy: 0.520 test_accuracy: 0.485\n",
            "[3,  1025] train_loss: 1.441 train_accuracy: 0.515 test_accuracy: 0.484\n",
            "[3,  1030] train_loss: 1.525 train_accuracy: 0.509 test_accuracy: 0.478\n",
            "[3,  1035] train_loss: 1.390 train_accuracy: 0.518 test_accuracy: 0.484\n",
            "[3,  1040] train_loss: 1.442 train_accuracy: 0.519 test_accuracy: 0.482\n",
            "[3,  1045] train_loss: 1.411 train_accuracy: 0.509 test_accuracy: 0.472\n",
            "[3,  1050] train_loss: 1.445 train_accuracy: 0.521 test_accuracy: 0.480\n",
            "[3,  1055] train_loss: 1.499 train_accuracy: 0.521 test_accuracy: 0.481\n",
            "[3,  1060] train_loss: 1.490 train_accuracy: 0.517 test_accuracy: 0.474\n",
            "[3,  1065] train_loss: 1.422 train_accuracy: 0.515 test_accuracy: 0.475\n",
            "[3,  1070] train_loss: 1.516 train_accuracy: 0.505 test_accuracy: 0.465\n",
            "[3,  1075] train_loss: 1.439 train_accuracy: 0.509 test_accuracy: 0.474\n",
            "[3,  1080] train_loss: 1.398 train_accuracy: 0.513 test_accuracy: 0.481\n",
            "[3,  1085] train_loss: 1.370 train_accuracy: 0.513 test_accuracy: 0.478\n",
            "[3,  1090] train_loss: 1.595 train_accuracy: 0.522 test_accuracy: 0.490\n",
            "[3,  1095] train_loss: 1.255 train_accuracy: 0.533 test_accuracy: 0.497\n",
            "[3,  1100] train_loss: 1.426 train_accuracy: 0.523 test_accuracy: 0.490\n",
            "[3,  1105] train_loss: 1.445 train_accuracy: 0.530 test_accuracy: 0.497\n",
            "[3,  1110] train_loss: 1.500 train_accuracy: 0.525 test_accuracy: 0.484\n",
            "[3,  1115] train_loss: 1.427 train_accuracy: 0.521 test_accuracy: 0.475\n",
            "[3,  1120] train_loss: 1.431 train_accuracy: 0.521 test_accuracy: 0.483\n",
            "[3,  1125] train_loss: 1.449 train_accuracy: 0.528 test_accuracy: 0.491\n",
            "[3,  1130] train_loss: 1.427 train_accuracy: 0.532 test_accuracy: 0.495\n",
            "[3,  1135] train_loss: 1.392 train_accuracy: 0.533 test_accuracy: 0.494\n",
            "[3,  1140] train_loss: 1.420 train_accuracy: 0.521 test_accuracy: 0.489\n",
            "[3,  1145] train_loss: 1.409 train_accuracy: 0.523 test_accuracy: 0.492\n",
            "[3,  1150] train_loss: 1.564 train_accuracy: 0.533 test_accuracy: 0.496\n",
            "[3,  1155] train_loss: 1.393 train_accuracy: 0.520 test_accuracy: 0.481\n",
            "[3,  1160] train_loss: 1.470 train_accuracy: 0.526 test_accuracy: 0.492\n",
            "[3,  1165] train_loss: 1.386 train_accuracy: 0.526 test_accuracy: 0.489\n",
            "[3,  1170] train_loss: 1.402 train_accuracy: 0.524 test_accuracy: 0.487\n",
            "[3,  1175] train_loss: 1.414 train_accuracy: 0.515 test_accuracy: 0.484\n",
            "[3,  1180] train_loss: 1.343 train_accuracy: 0.510 test_accuracy: 0.477\n",
            "[3,  1185] train_loss: 1.568 train_accuracy: 0.508 test_accuracy: 0.473\n",
            "[3,  1190] train_loss: 1.418 train_accuracy: 0.517 test_accuracy: 0.481\n",
            "[3,  1195] train_loss: 1.481 train_accuracy: 0.520 test_accuracy: 0.482\n",
            "[3,  1200] train_loss: 1.470 train_accuracy: 0.509 test_accuracy: 0.474\n",
            "[3,  1205] train_loss: 1.523 train_accuracy: 0.496 test_accuracy: 0.470\n",
            "[3,  1210] train_loss: 1.528 train_accuracy: 0.496 test_accuracy: 0.467\n",
            "[3,  1215] train_loss: 1.402 train_accuracy: 0.513 test_accuracy: 0.477\n",
            "[3,  1220] train_loss: 1.486 train_accuracy: 0.515 test_accuracy: 0.477\n",
            "[3,  1225] train_loss: 1.578 train_accuracy: 0.505 test_accuracy: 0.469\n",
            "[3,  1230] train_loss: 1.622 train_accuracy: 0.510 test_accuracy: 0.471\n",
            "[3,  1235] train_loss: 1.458 train_accuracy: 0.527 test_accuracy: 0.490\n",
            "[3,  1240] train_loss: 1.349 train_accuracy: 0.526 test_accuracy: 0.493\n",
            "[3,  1245] train_loss: 1.501 train_accuracy: 0.521 test_accuracy: 0.486\n",
            "[4,     5] train_loss: 1.390 train_accuracy: 0.521 test_accuracy: 0.485\n",
            "[4,    10] train_loss: 1.417 train_accuracy: 0.510 test_accuracy: 0.476\n",
            "[4,    15] train_loss: 1.503 train_accuracy: 0.522 test_accuracy: 0.485\n",
            "[4,    20] train_loss: 1.339 train_accuracy: 0.525 test_accuracy: 0.484\n",
            "[4,    25] train_loss: 1.317 train_accuracy: 0.517 test_accuracy: 0.480\n",
            "[4,    30] train_loss: 1.272 train_accuracy: 0.525 test_accuracy: 0.489\n",
            "[4,    35] train_loss: 1.385 train_accuracy: 0.532 test_accuracy: 0.486\n",
            "[4,    40] train_loss: 1.354 train_accuracy: 0.526 test_accuracy: 0.480\n",
            "[4,    45] train_loss: 1.320 train_accuracy: 0.528 test_accuracy: 0.486\n",
            "[4,    50] train_loss: 1.417 train_accuracy: 0.520 test_accuracy: 0.478\n",
            "[4,    55] train_loss: 1.237 train_accuracy: 0.520 test_accuracy: 0.481\n",
            "[4,    60] train_loss: 1.362 train_accuracy: 0.520 test_accuracy: 0.483\n",
            "[4,    65] train_loss: 1.526 train_accuracy: 0.520 test_accuracy: 0.485\n",
            "[4,    70] train_loss: 1.286 train_accuracy: 0.527 test_accuracy: 0.492\n",
            "[4,    75] train_loss: 1.320 train_accuracy: 0.525 test_accuracy: 0.483\n",
            "[4,    80] train_loss: 1.329 train_accuracy: 0.522 test_accuracy: 0.489\n",
            "[4,    85] train_loss: 1.417 train_accuracy: 0.527 test_accuracy: 0.493\n",
            "[4,    90] train_loss: 1.250 train_accuracy: 0.535 test_accuracy: 0.496\n",
            "[4,    95] train_loss: 1.438 train_accuracy: 0.523 test_accuracy: 0.478\n",
            "[4,   100] train_loss: 1.293 train_accuracy: 0.538 test_accuracy: 0.490\n",
            "[4,   105] train_loss: 1.372 train_accuracy: 0.538 test_accuracy: 0.497\n",
            "[4,   110] train_loss: 1.364 train_accuracy: 0.526 test_accuracy: 0.487\n",
            "[4,   115] train_loss: 1.381 train_accuracy: 0.531 test_accuracy: 0.496\n",
            "[4,   120] train_loss: 1.359 train_accuracy: 0.525 test_accuracy: 0.491\n",
            "[4,   125] train_loss: 1.350 train_accuracy: 0.519 test_accuracy: 0.485\n",
            "[4,   130] train_loss: 1.340 train_accuracy: 0.535 test_accuracy: 0.502\n",
            "[4,   135] train_loss: 1.284 train_accuracy: 0.513 test_accuracy: 0.481\n",
            "[4,   140] train_loss: 1.459 train_accuracy: 0.518 test_accuracy: 0.480\n",
            "[4,   145] train_loss: 1.458 train_accuracy: 0.522 test_accuracy: 0.484\n",
            "[4,   150] train_loss: 1.397 train_accuracy: 0.519 test_accuracy: 0.486\n",
            "[4,   155] train_loss: 1.437 train_accuracy: 0.525 test_accuracy: 0.493\n",
            "[4,   160] train_loss: 1.223 train_accuracy: 0.511 test_accuracy: 0.478\n",
            "[4,   165] train_loss: 1.356 train_accuracy: 0.522 test_accuracy: 0.483\n",
            "[4,   170] train_loss: 1.439 train_accuracy: 0.522 test_accuracy: 0.483\n",
            "[4,   175] train_loss: 1.309 train_accuracy: 0.528 test_accuracy: 0.486\n",
            "[4,   180] train_loss: 1.404 train_accuracy: 0.532 test_accuracy: 0.496\n",
            "[4,   185] train_loss: 1.282 train_accuracy: 0.526 test_accuracy: 0.487\n",
            "[4,   190] train_loss: 1.469 train_accuracy: 0.529 test_accuracy: 0.492\n",
            "[4,   195] train_loss: 1.325 train_accuracy: 0.533 test_accuracy: 0.492\n",
            "[4,   200] train_loss: 1.450 train_accuracy: 0.538 test_accuracy: 0.495\n",
            "[4,   205] train_loss: 1.407 train_accuracy: 0.536 test_accuracy: 0.498\n",
            "[4,   210] train_loss: 1.325 train_accuracy: 0.523 test_accuracy: 0.487\n",
            "[4,   215] train_loss: 1.500 train_accuracy: 0.512 test_accuracy: 0.484\n",
            "[4,   220] train_loss: 1.362 train_accuracy: 0.513 test_accuracy: 0.477\n",
            "[4,   225] train_loss: 1.451 train_accuracy: 0.529 test_accuracy: 0.486\n",
            "[4,   230] train_loss: 1.465 train_accuracy: 0.532 test_accuracy: 0.487\n",
            "[4,   235] train_loss: 1.342 train_accuracy: 0.518 test_accuracy: 0.480\n",
            "[4,   240] train_loss: 1.392 train_accuracy: 0.525 test_accuracy: 0.486\n",
            "[4,   245] train_loss: 1.462 train_accuracy: 0.528 test_accuracy: 0.489\n",
            "[4,   250] train_loss: 1.333 train_accuracy: 0.533 test_accuracy: 0.485\n",
            "[4,   255] train_loss: 1.324 train_accuracy: 0.528 test_accuracy: 0.486\n",
            "[4,   260] train_loss: 1.343 train_accuracy: 0.529 test_accuracy: 0.486\n",
            "[4,   265] train_loss: 1.247 train_accuracy: 0.532 test_accuracy: 0.485\n",
            "[4,   270] train_loss: 1.451 train_accuracy: 0.530 test_accuracy: 0.482\n",
            "[4,   275] train_loss: 1.451 train_accuracy: 0.524 test_accuracy: 0.488\n",
            "[4,   280] train_loss: 1.318 train_accuracy: 0.525 test_accuracy: 0.485\n",
            "[4,   285] train_loss: 1.336 train_accuracy: 0.520 test_accuracy: 0.485\n",
            "[4,   290] train_loss: 1.525 train_accuracy: 0.517 test_accuracy: 0.476\n",
            "[4,   295] train_loss: 1.474 train_accuracy: 0.533 test_accuracy: 0.489\n",
            "[4,   300] train_loss: 1.432 train_accuracy: 0.521 test_accuracy: 0.479\n",
            "[4,   305] train_loss: 1.401 train_accuracy: 0.523 test_accuracy: 0.485\n",
            "[4,   310] train_loss: 1.577 train_accuracy: 0.536 test_accuracy: 0.494\n",
            "[4,   315] train_loss: 1.347 train_accuracy: 0.532 test_accuracy: 0.496\n",
            "[4,   320] train_loss: 1.279 train_accuracy: 0.518 test_accuracy: 0.482\n",
            "[4,   325] train_loss: 1.506 train_accuracy: 0.521 test_accuracy: 0.485\n",
            "[4,   330] train_loss: 1.346 train_accuracy: 0.533 test_accuracy: 0.496\n",
            "[4,   335] train_loss: 1.397 train_accuracy: 0.517 test_accuracy: 0.490\n",
            "[4,   340] train_loss: 1.404 train_accuracy: 0.533 test_accuracy: 0.497\n",
            "[4,   345] train_loss: 1.421 train_accuracy: 0.544 test_accuracy: 0.499\n",
            "[4,   350] train_loss: 1.287 train_accuracy: 0.546 test_accuracy: 0.499\n",
            "[4,   355] train_loss: 1.496 train_accuracy: 0.538 test_accuracy: 0.489\n",
            "[4,   360] train_loss: 1.516 train_accuracy: 0.530 test_accuracy: 0.483\n",
            "[4,   365] train_loss: 1.267 train_accuracy: 0.539 test_accuracy: 0.500\n",
            "[4,   370] train_loss: 1.427 train_accuracy: 0.527 test_accuracy: 0.490\n",
            "[4,   375] train_loss: 1.408 train_accuracy: 0.529 test_accuracy: 0.488\n",
            "[4,   380] train_loss: 1.444 train_accuracy: 0.540 test_accuracy: 0.496\n",
            "[4,   385] train_loss: 1.241 train_accuracy: 0.534 test_accuracy: 0.488\n",
            "[4,   390] train_loss: 1.346 train_accuracy: 0.538 test_accuracy: 0.492\n",
            "[4,   395] train_loss: 1.424 train_accuracy: 0.538 test_accuracy: 0.493\n",
            "[4,   400] train_loss: 1.322 train_accuracy: 0.530 test_accuracy: 0.487\n",
            "[4,   405] train_loss: 1.395 train_accuracy: 0.527 test_accuracy: 0.477\n",
            "[4,   410] train_loss: 1.319 train_accuracy: 0.529 test_accuracy: 0.484\n",
            "[4,   415] train_loss: 1.449 train_accuracy: 0.534 test_accuracy: 0.488\n",
            "[4,   420] train_loss: 1.313 train_accuracy: 0.546 test_accuracy: 0.496\n",
            "[4,   425] train_loss: 1.379 train_accuracy: 0.526 test_accuracy: 0.494\n",
            "[4,   430] train_loss: 1.388 train_accuracy: 0.522 test_accuracy: 0.487\n",
            "[4,   435] train_loss: 1.410 train_accuracy: 0.538 test_accuracy: 0.495\n",
            "[4,   440] train_loss: 1.340 train_accuracy: 0.528 test_accuracy: 0.491\n",
            "[4,   445] train_loss: 1.396 train_accuracy: 0.520 test_accuracy: 0.480\n",
            "[4,   450] train_loss: 1.388 train_accuracy: 0.539 test_accuracy: 0.491\n",
            "[4,   455] train_loss: 1.229 train_accuracy: 0.533 test_accuracy: 0.484\n",
            "[4,   460] train_loss: 1.336 train_accuracy: 0.525 test_accuracy: 0.482\n",
            "[4,   465] train_loss: 1.366 train_accuracy: 0.526 test_accuracy: 0.479\n",
            "[4,   470] train_loss: 1.288 train_accuracy: 0.524 test_accuracy: 0.480\n",
            "[4,   475] train_loss: 1.483 train_accuracy: 0.535 test_accuracy: 0.487\n",
            "[4,   480] train_loss: 1.564 train_accuracy: 0.513 test_accuracy: 0.474\n",
            "[4,   485] train_loss: 1.469 train_accuracy: 0.531 test_accuracy: 0.490\n",
            "[4,   490] train_loss: 1.448 train_accuracy: 0.534 test_accuracy: 0.496\n",
            "[4,   495] train_loss: 1.424 train_accuracy: 0.526 test_accuracy: 0.489\n",
            "[4,   500] train_loss: 1.459 train_accuracy: 0.515 test_accuracy: 0.482\n",
            "[4,   505] train_loss: 1.369 train_accuracy: 0.520 test_accuracy: 0.488\n",
            "[4,   510] train_loss: 1.348 train_accuracy: 0.526 test_accuracy: 0.486\n",
            "[4,   515] train_loss: 1.474 train_accuracy: 0.525 test_accuracy: 0.477\n",
            "[4,   520] train_loss: 1.399 train_accuracy: 0.533 test_accuracy: 0.491\n",
            "[4,   525] train_loss: 1.356 train_accuracy: 0.533 test_accuracy: 0.489\n",
            "[4,   530] train_loss: 1.435 train_accuracy: 0.538 test_accuracy: 0.492\n",
            "[4,   535] train_loss: 1.343 train_accuracy: 0.534 test_accuracy: 0.486\n",
            "[4,   540] train_loss: 1.382 train_accuracy: 0.530 test_accuracy: 0.492\n",
            "[4,   545] train_loss: 1.231 train_accuracy: 0.536 test_accuracy: 0.494\n",
            "[4,   550] train_loss: 1.264 train_accuracy: 0.530 test_accuracy: 0.492\n",
            "[4,   555] train_loss: 1.424 train_accuracy: 0.536 test_accuracy: 0.498\n",
            "[4,   560] train_loss: 1.436 train_accuracy: 0.537 test_accuracy: 0.496\n",
            "[4,   565] train_loss: 1.432 train_accuracy: 0.542 test_accuracy: 0.496\n",
            "[4,   570] train_loss: 1.323 train_accuracy: 0.536 test_accuracy: 0.488\n",
            "[4,   575] train_loss: 1.429 train_accuracy: 0.540 test_accuracy: 0.495\n",
            "[4,   580] train_loss: 1.381 train_accuracy: 0.545 test_accuracy: 0.499\n",
            "[4,   585] train_loss: 1.305 train_accuracy: 0.549 test_accuracy: 0.500\n",
            "[4,   590] train_loss: 1.366 train_accuracy: 0.544 test_accuracy: 0.496\n",
            "[4,   595] train_loss: 1.199 train_accuracy: 0.545 test_accuracy: 0.494\n",
            "[4,   600] train_loss: 1.340 train_accuracy: 0.541 test_accuracy: 0.494\n",
            "[4,   605] train_loss: 1.402 train_accuracy: 0.540 test_accuracy: 0.489\n",
            "[4,   610] train_loss: 1.513 train_accuracy: 0.528 test_accuracy: 0.482\n",
            "[4,   615] train_loss: 1.413 train_accuracy: 0.527 test_accuracy: 0.484\n",
            "[4,   620] train_loss: 1.405 train_accuracy: 0.519 test_accuracy: 0.478\n",
            "[4,   625] train_loss: 1.403 train_accuracy: 0.543 test_accuracy: 0.493\n",
            "[4,   630] train_loss: 1.314 train_accuracy: 0.543 test_accuracy: 0.497\n",
            "[4,   635] train_loss: 1.227 train_accuracy: 0.537 test_accuracy: 0.487\n",
            "[4,   640] train_loss: 1.419 train_accuracy: 0.530 test_accuracy: 0.482\n",
            "[4,   645] train_loss: 1.543 train_accuracy: 0.539 test_accuracy: 0.489\n",
            "[4,   650] train_loss: 1.315 train_accuracy: 0.513 test_accuracy: 0.473\n",
            "[4,   655] train_loss: 1.341 train_accuracy: 0.535 test_accuracy: 0.492\n",
            "[4,   660] train_loss: 1.475 train_accuracy: 0.537 test_accuracy: 0.493\n",
            "[4,   665] train_loss: 1.412 train_accuracy: 0.531 test_accuracy: 0.488\n",
            "[4,   670] train_loss: 1.304 train_accuracy: 0.534 test_accuracy: 0.485\n",
            "[4,   675] train_loss: 1.205 train_accuracy: 0.538 test_accuracy: 0.488\n",
            "[4,   680] train_loss: 1.398 train_accuracy: 0.549 test_accuracy: 0.493\n",
            "[4,   685] train_loss: 1.364 train_accuracy: 0.539 test_accuracy: 0.490\n",
            "[4,   690] train_loss: 1.203 train_accuracy: 0.534 test_accuracy: 0.486\n",
            "[4,   695] train_loss: 1.365 train_accuracy: 0.548 test_accuracy: 0.498\n",
            "[4,   700] train_loss: 1.442 train_accuracy: 0.549 test_accuracy: 0.505\n",
            "[4,   705] train_loss: 1.307 train_accuracy: 0.547 test_accuracy: 0.501\n",
            "[4,   710] train_loss: 1.423 train_accuracy: 0.522 test_accuracy: 0.487\n",
            "[4,   715] train_loss: 1.374 train_accuracy: 0.547 test_accuracy: 0.504\n",
            "[4,   720] train_loss: 1.428 train_accuracy: 0.548 test_accuracy: 0.498\n",
            "[4,   725] train_loss: 1.363 train_accuracy: 0.536 test_accuracy: 0.491\n",
            "[4,   730] train_loss: 1.405 train_accuracy: 0.550 test_accuracy: 0.501\n",
            "[4,   735] train_loss: 1.347 train_accuracy: 0.540 test_accuracy: 0.488\n",
            "[4,   740] train_loss: 1.462 train_accuracy: 0.552 test_accuracy: 0.506\n",
            "[4,   745] train_loss: 1.356 train_accuracy: 0.548 test_accuracy: 0.503\n",
            "[4,   750] train_loss: 1.242 train_accuracy: 0.550 test_accuracy: 0.504\n",
            "[4,   755] train_loss: 1.380 train_accuracy: 0.537 test_accuracy: 0.492\n",
            "[4,   760] train_loss: 1.382 train_accuracy: 0.542 test_accuracy: 0.504\n",
            "[4,   765] train_loss: 1.453 train_accuracy: 0.538 test_accuracy: 0.499\n",
            "[4,   770] train_loss: 1.368 train_accuracy: 0.532 test_accuracy: 0.489\n",
            "[4,   775] train_loss: 1.332 train_accuracy: 0.544 test_accuracy: 0.499\n",
            "[4,   780] train_loss: 1.294 train_accuracy: 0.537 test_accuracy: 0.489\n",
            "[4,   785] train_loss: 1.342 train_accuracy: 0.546 test_accuracy: 0.501\n",
            "[4,   790] train_loss: 1.531 train_accuracy: 0.542 test_accuracy: 0.496\n",
            "[4,   795] train_loss: 1.364 train_accuracy: 0.530 test_accuracy: 0.483\n",
            "[4,   800] train_loss: 1.313 train_accuracy: 0.549 test_accuracy: 0.500\n",
            "[4,   805] train_loss: 1.398 train_accuracy: 0.538 test_accuracy: 0.491\n",
            "[4,   810] train_loss: 1.286 train_accuracy: 0.546 test_accuracy: 0.502\n",
            "[4,   815] train_loss: 1.265 train_accuracy: 0.541 test_accuracy: 0.497\n",
            "[4,   820] train_loss: 1.347 train_accuracy: 0.535 test_accuracy: 0.489\n",
            "[4,   825] train_loss: 1.289 train_accuracy: 0.547 test_accuracy: 0.499\n",
            "[4,   830] train_loss: 1.327 train_accuracy: 0.541 test_accuracy: 0.493\n",
            "[4,   835] train_loss: 1.295 train_accuracy: 0.529 test_accuracy: 0.485\n",
            "[4,   840] train_loss: 1.398 train_accuracy: 0.521 test_accuracy: 0.483\n",
            "[4,   845] train_loss: 1.419 train_accuracy: 0.533 test_accuracy: 0.492\n",
            "[4,   850] train_loss: 1.431 train_accuracy: 0.540 test_accuracy: 0.492\n",
            "[4,   855] train_loss: 1.390 train_accuracy: 0.541 test_accuracy: 0.495\n",
            "[4,   860] train_loss: 1.300 train_accuracy: 0.537 test_accuracy: 0.489\n",
            "[4,   865] train_loss: 1.433 train_accuracy: 0.553 test_accuracy: 0.496\n",
            "[4,   870] train_loss: 1.318 train_accuracy: 0.558 test_accuracy: 0.497\n",
            "[4,   875] train_loss: 1.294 train_accuracy: 0.557 test_accuracy: 0.508\n",
            "[4,   880] train_loss: 1.196 train_accuracy: 0.559 test_accuracy: 0.509\n",
            "[4,   885] train_loss: 1.357 train_accuracy: 0.555 test_accuracy: 0.501\n",
            "[4,   890] train_loss: 1.436 train_accuracy: 0.548 test_accuracy: 0.501\n",
            "[4,   895] train_loss: 1.331 train_accuracy: 0.558 test_accuracy: 0.509\n",
            "[4,   900] train_loss: 1.247 train_accuracy: 0.548 test_accuracy: 0.499\n",
            "[4,   905] train_loss: 1.445 train_accuracy: 0.544 test_accuracy: 0.490\n",
            "[4,   910] train_loss: 1.379 train_accuracy: 0.551 test_accuracy: 0.497\n",
            "[4,   915] train_loss: 1.525 train_accuracy: 0.543 test_accuracy: 0.491\n",
            "[4,   920] train_loss: 1.449 train_accuracy: 0.551 test_accuracy: 0.498\n",
            "[4,   925] train_loss: 1.357 train_accuracy: 0.545 test_accuracy: 0.495\n",
            "[4,   930] train_loss: 1.472 train_accuracy: 0.548 test_accuracy: 0.499\n",
            "[4,   935] train_loss: 1.491 train_accuracy: 0.549 test_accuracy: 0.503\n",
            "[4,   940] train_loss: 1.411 train_accuracy: 0.544 test_accuracy: 0.499\n",
            "[4,   945] train_loss: 1.381 train_accuracy: 0.544 test_accuracy: 0.501\n",
            "[4,   950] train_loss: 1.308 train_accuracy: 0.555 test_accuracy: 0.511\n",
            "[4,   955] train_loss: 1.493 train_accuracy: 0.555 test_accuracy: 0.505\n",
            "[4,   960] train_loss: 1.319 train_accuracy: 0.555 test_accuracy: 0.502\n",
            "[4,   965] train_loss: 1.288 train_accuracy: 0.555 test_accuracy: 0.504\n",
            "[4,   970] train_loss: 1.447 train_accuracy: 0.552 test_accuracy: 0.507\n",
            "[4,   975] train_loss: 1.359 train_accuracy: 0.539 test_accuracy: 0.498\n",
            "[4,   980] train_loss: 1.332 train_accuracy: 0.548 test_accuracy: 0.500\n",
            "[4,   985] train_loss: 1.422 train_accuracy: 0.550 test_accuracy: 0.496\n",
            "[4,   990] train_loss: 1.395 train_accuracy: 0.531 test_accuracy: 0.482\n",
            "[4,   995] train_loss: 1.405 train_accuracy: 0.527 test_accuracy: 0.480\n",
            "[4,  1000] train_loss: 1.324 train_accuracy: 0.530 test_accuracy: 0.483\n",
            "[4,  1005] train_loss: 1.396 train_accuracy: 0.542 test_accuracy: 0.494\n",
            "[4,  1010] train_loss: 1.388 train_accuracy: 0.534 test_accuracy: 0.489\n",
            "[4,  1015] train_loss: 1.440 train_accuracy: 0.543 test_accuracy: 0.494\n",
            "[4,  1020] train_loss: 1.329 train_accuracy: 0.540 test_accuracy: 0.494\n",
            "[4,  1025] train_loss: 1.292 train_accuracy: 0.544 test_accuracy: 0.497\n",
            "[4,  1030] train_loss: 1.577 train_accuracy: 0.545 test_accuracy: 0.495\n",
            "[4,  1035] train_loss: 1.277 train_accuracy: 0.555 test_accuracy: 0.502\n",
            "[4,  1040] train_loss: 1.306 train_accuracy: 0.552 test_accuracy: 0.502\n",
            "[4,  1045] train_loss: 1.418 train_accuracy: 0.541 test_accuracy: 0.491\n",
            "[4,  1050] train_loss: 1.372 train_accuracy: 0.540 test_accuracy: 0.493\n",
            "[4,  1055] train_loss: 1.516 train_accuracy: 0.550 test_accuracy: 0.494\n",
            "[4,  1060] train_loss: 1.227 train_accuracy: 0.548 test_accuracy: 0.493\n",
            "[4,  1065] train_loss: 1.361 train_accuracy: 0.543 test_accuracy: 0.492\n",
            "[4,  1070] train_loss: 1.354 train_accuracy: 0.538 test_accuracy: 0.485\n",
            "[4,  1075] train_loss: 1.405 train_accuracy: 0.534 test_accuracy: 0.484\n",
            "[4,  1080] train_loss: 1.466 train_accuracy: 0.539 test_accuracy: 0.480\n",
            "[4,  1085] train_loss: 1.436 train_accuracy: 0.549 test_accuracy: 0.490\n",
            "[4,  1090] train_loss: 1.297 train_accuracy: 0.555 test_accuracy: 0.496\n",
            "[4,  1095] train_loss: 1.356 train_accuracy: 0.554 test_accuracy: 0.501\n",
            "[4,  1100] train_loss: 1.402 train_accuracy: 0.539 test_accuracy: 0.482\n",
            "[4,  1105] train_loss: 1.460 train_accuracy: 0.544 test_accuracy: 0.491\n",
            "[4,  1110] train_loss: 1.320 train_accuracy: 0.554 test_accuracy: 0.505\n",
            "[4,  1115] train_loss: 1.392 train_accuracy: 0.554 test_accuracy: 0.500\n",
            "[4,  1120] train_loss: 1.407 train_accuracy: 0.561 test_accuracy: 0.504\n",
            "[4,  1125] train_loss: 1.550 train_accuracy: 0.559 test_accuracy: 0.500\n",
            "[4,  1130] train_loss: 1.387 train_accuracy: 0.556 test_accuracy: 0.498\n",
            "[4,  1135] train_loss: 1.350 train_accuracy: 0.532 test_accuracy: 0.484\n",
            "[4,  1140] train_loss: 1.247 train_accuracy: 0.522 test_accuracy: 0.477\n",
            "[4,  1145] train_loss: 1.366 train_accuracy: 0.533 test_accuracy: 0.476\n",
            "[4,  1150] train_loss: 1.468 train_accuracy: 0.542 test_accuracy: 0.485\n",
            "[4,  1155] train_loss: 1.256 train_accuracy: 0.549 test_accuracy: 0.497\n",
            "[4,  1160] train_loss: 1.392 train_accuracy: 0.545 test_accuracy: 0.500\n",
            "[4,  1165] train_loss: 1.232 train_accuracy: 0.545 test_accuracy: 0.499\n",
            "[4,  1170] train_loss: 1.327 train_accuracy: 0.540 test_accuracy: 0.489\n",
            "[4,  1175] train_loss: 1.284 train_accuracy: 0.556 test_accuracy: 0.505\n",
            "[4,  1180] train_loss: 1.412 train_accuracy: 0.549 test_accuracy: 0.497\n",
            "[4,  1185] train_loss: 1.380 train_accuracy: 0.548 test_accuracy: 0.492\n",
            "[4,  1190] train_loss: 1.438 train_accuracy: 0.548 test_accuracy: 0.496\n",
            "[4,  1195] train_loss: 1.425 train_accuracy: 0.560 test_accuracy: 0.506\n",
            "[4,  1200] train_loss: 1.310 train_accuracy: 0.552 test_accuracy: 0.494\n",
            "[4,  1205] train_loss: 1.320 train_accuracy: 0.533 test_accuracy: 0.480\n",
            "[4,  1210] train_loss: 1.495 train_accuracy: 0.549 test_accuracy: 0.493\n",
            "[4,  1215] train_loss: 1.289 train_accuracy: 0.551 test_accuracy: 0.494\n",
            "[4,  1220] train_loss: 1.320 train_accuracy: 0.545 test_accuracy: 0.493\n",
            "[4,  1225] train_loss: 1.482 train_accuracy: 0.548 test_accuracy: 0.497\n",
            "[4,  1230] train_loss: 1.392 train_accuracy: 0.549 test_accuracy: 0.503\n",
            "[4,  1235] train_loss: 1.389 train_accuracy: 0.542 test_accuracy: 0.495\n",
            "[4,  1240] train_loss: 1.309 train_accuracy: 0.551 test_accuracy: 0.499\n",
            "[4,  1245] train_loss: 1.280 train_accuracy: 0.546 test_accuracy: 0.498\n",
            "[5,     5] train_loss: 1.266 train_accuracy: 0.533 test_accuracy: 0.492\n",
            "[5,    10] train_loss: 1.467 train_accuracy: 0.529 test_accuracy: 0.487\n",
            "[5,    15] train_loss: 1.370 train_accuracy: 0.542 test_accuracy: 0.492\n",
            "[5,    20] train_loss: 1.356 train_accuracy: 0.545 test_accuracy: 0.493\n",
            "[5,    25] train_loss: 1.347 train_accuracy: 0.539 test_accuracy: 0.485\n",
            "[5,    30] train_loss: 1.329 train_accuracy: 0.550 test_accuracy: 0.494\n",
            "[5,    35] train_loss: 1.412 train_accuracy: 0.556 test_accuracy: 0.504\n",
            "[5,    40] train_loss: 1.505 train_accuracy: 0.548 test_accuracy: 0.495\n",
            "[5,    45] train_loss: 1.158 train_accuracy: 0.540 test_accuracy: 0.486\n",
            "[5,    50] train_loss: 1.413 train_accuracy: 0.541 test_accuracy: 0.490\n",
            "[5,    55] train_loss: 1.370 train_accuracy: 0.531 test_accuracy: 0.482\n",
            "[5,    60] train_loss: 1.323 train_accuracy: 0.553 test_accuracy: 0.489\n",
            "[5,    65] train_loss: 1.240 train_accuracy: 0.550 test_accuracy: 0.493\n",
            "[5,    70] train_loss: 1.284 train_accuracy: 0.549 test_accuracy: 0.496\n",
            "[5,    75] train_loss: 1.257 train_accuracy: 0.560 test_accuracy: 0.504\n",
            "[5,    80] train_loss: 1.208 train_accuracy: 0.558 test_accuracy: 0.501\n",
            "[5,    85] train_loss: 1.289 train_accuracy: 0.557 test_accuracy: 0.503\n",
            "[5,    90] train_loss: 1.288 train_accuracy: 0.551 test_accuracy: 0.500\n",
            "[5,    95] train_loss: 1.364 train_accuracy: 0.541 test_accuracy: 0.490\n",
            "[5,   100] train_loss: 1.272 train_accuracy: 0.558 test_accuracy: 0.504\n",
            "[5,   105] train_loss: 1.331 train_accuracy: 0.545 test_accuracy: 0.487\n",
            "[5,   110] train_loss: 1.285 train_accuracy: 0.544 test_accuracy: 0.488\n",
            "[5,   115] train_loss: 1.351 train_accuracy: 0.559 test_accuracy: 0.507\n",
            "[5,   120] train_loss: 1.147 train_accuracy: 0.555 test_accuracy: 0.504\n",
            "[5,   125] train_loss: 1.305 train_accuracy: 0.561 test_accuracy: 0.511\n",
            "[5,   130] train_loss: 1.225 train_accuracy: 0.571 test_accuracy: 0.503\n",
            "[5,   135] train_loss: 1.365 train_accuracy: 0.562 test_accuracy: 0.503\n",
            "[5,   140] train_loss: 1.346 train_accuracy: 0.557 test_accuracy: 0.497\n",
            "[5,   145] train_loss: 1.293 train_accuracy: 0.536 test_accuracy: 0.485\n",
            "[5,   150] train_loss: 1.260 train_accuracy: 0.538 test_accuracy: 0.482\n",
            "[5,   155] train_loss: 1.403 train_accuracy: 0.545 test_accuracy: 0.491\n",
            "[5,   160] train_loss: 1.180 train_accuracy: 0.546 test_accuracy: 0.490\n",
            "[5,   165] train_loss: 1.153 train_accuracy: 0.547 test_accuracy: 0.491\n",
            "[5,   170] train_loss: 1.241 train_accuracy: 0.546 test_accuracy: 0.497\n",
            "[5,   175] train_loss: 1.383 train_accuracy: 0.548 test_accuracy: 0.500\n",
            "[5,   180] train_loss: 1.204 train_accuracy: 0.538 test_accuracy: 0.487\n",
            "[5,   185] train_loss: 1.350 train_accuracy: 0.539 test_accuracy: 0.486\n",
            "[5,   190] train_loss: 1.348 train_accuracy: 0.547 test_accuracy: 0.501\n",
            "[5,   195] train_loss: 1.361 train_accuracy: 0.558 test_accuracy: 0.509\n",
            "[5,   200] train_loss: 1.276 train_accuracy: 0.557 test_accuracy: 0.507\n",
            "[5,   205] train_loss: 1.319 train_accuracy: 0.550 test_accuracy: 0.497\n",
            "[5,   210] train_loss: 1.369 train_accuracy: 0.552 test_accuracy: 0.493\n",
            "[5,   215] train_loss: 1.345 train_accuracy: 0.558 test_accuracy: 0.500\n",
            "[5,   220] train_loss: 1.359 train_accuracy: 0.552 test_accuracy: 0.495\n",
            "[5,   225] train_loss: 1.184 train_accuracy: 0.548 test_accuracy: 0.494\n",
            "[5,   230] train_loss: 1.403 train_accuracy: 0.549 test_accuracy: 0.487\n",
            "[5,   235] train_loss: 1.425 train_accuracy: 0.559 test_accuracy: 0.496\n",
            "[5,   240] train_loss: 1.173 train_accuracy: 0.555 test_accuracy: 0.502\n",
            "[5,   245] train_loss: 1.350 train_accuracy: 0.549 test_accuracy: 0.499\n",
            "[5,   250] train_loss: 1.284 train_accuracy: 0.557 test_accuracy: 0.495\n",
            "[5,   255] train_loss: 1.240 train_accuracy: 0.555 test_accuracy: 0.497\n",
            "[5,   260] train_loss: 1.279 train_accuracy: 0.535 test_accuracy: 0.482\n",
            "[5,   265] train_loss: 1.186 train_accuracy: 0.557 test_accuracy: 0.499\n",
            "[5,   270] train_loss: 1.182 train_accuracy: 0.569 test_accuracy: 0.507\n",
            "[5,   275] train_loss: 1.203 train_accuracy: 0.565 test_accuracy: 0.504\n",
            "[5,   280] train_loss: 1.362 train_accuracy: 0.568 test_accuracy: 0.504\n",
            "[5,   285] train_loss: 1.433 train_accuracy: 0.553 test_accuracy: 0.492\n",
            "[5,   290] train_loss: 1.411 train_accuracy: 0.520 test_accuracy: 0.469\n",
            "[5,   295] train_loss: 1.432 train_accuracy: 0.532 test_accuracy: 0.484\n",
            "[5,   300] train_loss: 1.224 train_accuracy: 0.539 test_accuracy: 0.486\n",
            "[5,   305] train_loss: 1.268 train_accuracy: 0.554 test_accuracy: 0.496\n",
            "[5,   310] train_loss: 1.328 train_accuracy: 0.554 test_accuracy: 0.496\n",
            "[5,   315] train_loss: 1.279 train_accuracy: 0.554 test_accuracy: 0.502\n",
            "[5,   320] train_loss: 1.366 train_accuracy: 0.562 test_accuracy: 0.502\n",
            "[5,   325] train_loss: 1.216 train_accuracy: 0.565 test_accuracy: 0.502\n",
            "[5,   330] train_loss: 1.290 train_accuracy: 0.563 test_accuracy: 0.504\n",
            "[5,   335] train_loss: 1.284 train_accuracy: 0.567 test_accuracy: 0.505\n",
            "[5,   340] train_loss: 1.329 train_accuracy: 0.557 test_accuracy: 0.502\n",
            "[5,   345] train_loss: 1.300 train_accuracy: 0.549 test_accuracy: 0.493\n",
            "[5,   350] train_loss: 1.302 train_accuracy: 0.548 test_accuracy: 0.496\n",
            "[5,   355] train_loss: 1.300 train_accuracy: 0.543 test_accuracy: 0.489\n",
            "[5,   360] train_loss: 1.419 train_accuracy: 0.546 test_accuracy: 0.491\n",
            "[5,   365] train_loss: 1.355 train_accuracy: 0.539 test_accuracy: 0.482\n",
            "[5,   370] train_loss: 1.464 train_accuracy: 0.545 test_accuracy: 0.488\n",
            "[5,   375] train_loss: 1.286 train_accuracy: 0.545 test_accuracy: 0.485\n",
            "[5,   380] train_loss: 1.390 train_accuracy: 0.557 test_accuracy: 0.501\n",
            "[5,   385] train_loss: 1.316 train_accuracy: 0.557 test_accuracy: 0.497\n",
            "[5,   390] train_loss: 1.356 train_accuracy: 0.560 test_accuracy: 0.499\n",
            "[5,   395] train_loss: 1.088 train_accuracy: 0.562 test_accuracy: 0.498\n",
            "[5,   400] train_loss: 1.270 train_accuracy: 0.561 test_accuracy: 0.503\n",
            "[5,   405] train_loss: 1.221 train_accuracy: 0.561 test_accuracy: 0.504\n",
            "[5,   410] train_loss: 1.369 train_accuracy: 0.565 test_accuracy: 0.502\n",
            "[5,   415] train_loss: 1.309 train_accuracy: 0.559 test_accuracy: 0.502\n",
            "[5,   420] train_loss: 1.285 train_accuracy: 0.556 test_accuracy: 0.505\n",
            "[5,   425] train_loss: 1.301 train_accuracy: 0.562 test_accuracy: 0.506\n",
            "[5,   430] train_loss: 1.198 train_accuracy: 0.565 test_accuracy: 0.507\n",
            "[5,   435] train_loss: 1.136 train_accuracy: 0.565 test_accuracy: 0.507\n",
            "[5,   440] train_loss: 1.217 train_accuracy: 0.563 test_accuracy: 0.507\n",
            "[5,   445] train_loss: 1.283 train_accuracy: 0.568 test_accuracy: 0.510\n",
            "[5,   450] train_loss: 1.238 train_accuracy: 0.561 test_accuracy: 0.500\n",
            "[5,   455] train_loss: 1.395 train_accuracy: 0.546 test_accuracy: 0.488\n",
            "[5,   460] train_loss: 1.255 train_accuracy: 0.550 test_accuracy: 0.490\n",
            "[5,   465] train_loss: 1.318 train_accuracy: 0.554 test_accuracy: 0.492\n",
            "[5,   470] train_loss: 1.385 train_accuracy: 0.552 test_accuracy: 0.496\n",
            "[5,   475] train_loss: 1.379 train_accuracy: 0.559 test_accuracy: 0.496\n",
            "[5,   480] train_loss: 1.323 train_accuracy: 0.565 test_accuracy: 0.497\n",
            "[5,   485] train_loss: 1.385 train_accuracy: 0.579 test_accuracy: 0.505\n",
            "[5,   490] train_loss: 1.336 train_accuracy: 0.565 test_accuracy: 0.499\n",
            "[5,   495] train_loss: 1.287 train_accuracy: 0.567 test_accuracy: 0.502\n",
            "[5,   500] train_loss: 1.262 train_accuracy: 0.575 test_accuracy: 0.507\n",
            "[5,   505] train_loss: 1.294 train_accuracy: 0.567 test_accuracy: 0.501\n",
            "[5,   510] train_loss: 1.176 train_accuracy: 0.574 test_accuracy: 0.505\n",
            "[5,   515] train_loss: 1.170 train_accuracy: 0.579 test_accuracy: 0.503\n",
            "[5,   520] train_loss: 1.402 train_accuracy: 0.565 test_accuracy: 0.496\n",
            "[5,   525] train_loss: 1.271 train_accuracy: 0.552 test_accuracy: 0.488\n",
            "[5,   530] train_loss: 1.358 train_accuracy: 0.564 test_accuracy: 0.498\n",
            "[5,   535] train_loss: 1.217 train_accuracy: 0.561 test_accuracy: 0.495\n",
            "[5,   540] train_loss: 1.180 train_accuracy: 0.554 test_accuracy: 0.496\n",
            "[5,   545] train_loss: 1.292 train_accuracy: 0.554 test_accuracy: 0.494\n",
            "[5,   550] train_loss: 1.382 train_accuracy: 0.549 test_accuracy: 0.494\n",
            "[5,   555] train_loss: 1.323 train_accuracy: 0.548 test_accuracy: 0.498\n",
            "[5,   560] train_loss: 1.408 train_accuracy: 0.555 test_accuracy: 0.504\n",
            "[5,   565] train_loss: 1.355 train_accuracy: 0.558 test_accuracy: 0.500\n",
            "[5,   570] train_loss: 1.409 train_accuracy: 0.560 test_accuracy: 0.500\n",
            "[5,   575] train_loss: 1.276 train_accuracy: 0.563 test_accuracy: 0.500\n",
            "[5,   580] train_loss: 1.414 train_accuracy: 0.570 test_accuracy: 0.504\n",
            "[5,   585] train_loss: 1.224 train_accuracy: 0.566 test_accuracy: 0.504\n",
            "[5,   590] train_loss: 1.288 train_accuracy: 0.568 test_accuracy: 0.503\n",
            "[5,   595] train_loss: 1.241 train_accuracy: 0.552 test_accuracy: 0.501\n",
            "[5,   600] train_loss: 1.328 train_accuracy: 0.553 test_accuracy: 0.503\n",
            "[5,   605] train_loss: 1.475 train_accuracy: 0.555 test_accuracy: 0.491\n",
            "[5,   610] train_loss: 1.364 train_accuracy: 0.561 test_accuracy: 0.494\n",
            "[5,   615] train_loss: 1.309 train_accuracy: 0.540 test_accuracy: 0.484\n",
            "[5,   620] train_loss: 1.312 train_accuracy: 0.542 test_accuracy: 0.488\n",
            "[5,   625] train_loss: 1.258 train_accuracy: 0.542 test_accuracy: 0.484\n",
            "[5,   630] train_loss: 1.263 train_accuracy: 0.545 test_accuracy: 0.492\n",
            "[5,   635] train_loss: 1.338 train_accuracy: 0.560 test_accuracy: 0.504\n",
            "[5,   640] train_loss: 1.280 train_accuracy: 0.559 test_accuracy: 0.503\n",
            "[5,   645] train_loss: 1.314 train_accuracy: 0.551 test_accuracy: 0.500\n",
            "[5,   650] train_loss: 1.308 train_accuracy: 0.555 test_accuracy: 0.506\n",
            "[5,   655] train_loss: 1.304 train_accuracy: 0.557 test_accuracy: 0.501\n",
            "[5,   660] train_loss: 1.269 train_accuracy: 0.556 test_accuracy: 0.491\n",
            "[5,   665] train_loss: 1.317 train_accuracy: 0.558 test_accuracy: 0.491\n",
            "[5,   670] train_loss: 1.336 train_accuracy: 0.563 test_accuracy: 0.499\n",
            "[5,   675] train_loss: 1.211 train_accuracy: 0.568 test_accuracy: 0.505\n",
            "[5,   680] train_loss: 1.386 train_accuracy: 0.573 test_accuracy: 0.504\n",
            "[5,   685] train_loss: 1.348 train_accuracy: 0.566 test_accuracy: 0.501\n",
            "[5,   690] train_loss: 1.397 train_accuracy: 0.566 test_accuracy: 0.497\n",
            "[5,   695] train_loss: 1.274 train_accuracy: 0.553 test_accuracy: 0.487\n",
            "[5,   700] train_loss: 1.229 train_accuracy: 0.548 test_accuracy: 0.494\n",
            "[5,   705] train_loss: 1.386 train_accuracy: 0.565 test_accuracy: 0.505\n",
            "[5,   710] train_loss: 1.250 train_accuracy: 0.571 test_accuracy: 0.510\n",
            "[5,   715] train_loss: 1.241 train_accuracy: 0.573 test_accuracy: 0.507\n",
            "[5,   720] train_loss: 1.314 train_accuracy: 0.569 test_accuracy: 0.501\n",
            "[5,   725] train_loss: 1.231 train_accuracy: 0.558 test_accuracy: 0.491\n",
            "[5,   730] train_loss: 1.356 train_accuracy: 0.558 test_accuracy: 0.486\n",
            "[5,   735] train_loss: 1.283 train_accuracy: 0.560 test_accuracy: 0.485\n",
            "[5,   740] train_loss: 1.413 train_accuracy: 0.553 test_accuracy: 0.492\n",
            "[5,   745] train_loss: 1.342 train_accuracy: 0.567 test_accuracy: 0.503\n",
            "[5,   750] train_loss: 1.269 train_accuracy: 0.571 test_accuracy: 0.508\n",
            "[5,   755] train_loss: 1.322 train_accuracy: 0.561 test_accuracy: 0.497\n",
            "[5,   760] train_loss: 1.236 train_accuracy: 0.570 test_accuracy: 0.504\n",
            "[5,   765] train_loss: 1.173 train_accuracy: 0.553 test_accuracy: 0.489\n",
            "[5,   770] train_loss: 1.352 train_accuracy: 0.556 test_accuracy: 0.486\n",
            "[5,   775] train_loss: 1.510 train_accuracy: 0.562 test_accuracy: 0.496\n",
            "[5,   780] train_loss: 1.287 train_accuracy: 0.553 test_accuracy: 0.485\n",
            "[5,   785] train_loss: 1.352 train_accuracy: 0.554 test_accuracy: 0.492\n",
            "[5,   790] train_loss: 1.308 train_accuracy: 0.558 test_accuracy: 0.491\n",
            "[5,   795] train_loss: 1.299 train_accuracy: 0.569 test_accuracy: 0.505\n",
            "[5,   800] train_loss: 1.394 train_accuracy: 0.568 test_accuracy: 0.504\n",
            "[5,   805] train_loss: 1.280 train_accuracy: 0.576 test_accuracy: 0.507\n",
            "[5,   810] train_loss: 1.350 train_accuracy: 0.570 test_accuracy: 0.502\n",
            "[5,   815] train_loss: 1.366 train_accuracy: 0.576 test_accuracy: 0.506\n",
            "[5,   820] train_loss: 1.294 train_accuracy: 0.565 test_accuracy: 0.497\n",
            "[5,   825] train_loss: 1.275 train_accuracy: 0.575 test_accuracy: 0.510\n",
            "[5,   830] train_loss: 1.229 train_accuracy: 0.573 test_accuracy: 0.506\n",
            "[5,   835] train_loss: 1.282 train_accuracy: 0.568 test_accuracy: 0.501\n",
            "[5,   840] train_loss: 1.244 train_accuracy: 0.560 test_accuracy: 0.497\n",
            "[5,   845] train_loss: 1.308 train_accuracy: 0.565 test_accuracy: 0.504\n",
            "[5,   850] train_loss: 1.349 train_accuracy: 0.562 test_accuracy: 0.501\n",
            "[5,   855] train_loss: 1.279 train_accuracy: 0.563 test_accuracy: 0.502\n",
            "[5,   860] train_loss: 1.410 train_accuracy: 0.553 test_accuracy: 0.498\n",
            "[5,   865] train_loss: 1.270 train_accuracy: 0.556 test_accuracy: 0.491\n",
            "[5,   870] train_loss: 1.444 train_accuracy: 0.553 test_accuracy: 0.486\n",
            "[5,   875] train_loss: 1.299 train_accuracy: 0.561 test_accuracy: 0.498\n",
            "[5,   880] train_loss: 1.312 train_accuracy: 0.567 test_accuracy: 0.503\n",
            "[5,   885] train_loss: 1.353 train_accuracy: 0.569 test_accuracy: 0.512\n",
            "[5,   890] train_loss: 1.440 train_accuracy: 0.560 test_accuracy: 0.507\n",
            "[5,   895] train_loss: 1.369 train_accuracy: 0.567 test_accuracy: 0.509\n",
            "[5,   900] train_loss: 1.212 train_accuracy: 0.569 test_accuracy: 0.512\n",
            "[5,   905] train_loss: 1.482 train_accuracy: 0.577 test_accuracy: 0.520\n",
            "[5,   910] train_loss: 1.263 train_accuracy: 0.565 test_accuracy: 0.505\n",
            "[5,   915] train_loss: 1.246 train_accuracy: 0.572 test_accuracy: 0.510\n",
            "[5,   920] train_loss: 1.293 train_accuracy: 0.577 test_accuracy: 0.514\n",
            "[5,   925] train_loss: 1.183 train_accuracy: 0.574 test_accuracy: 0.509\n",
            "[5,   930] train_loss: 1.231 train_accuracy: 0.563 test_accuracy: 0.506\n",
            "[5,   935] train_loss: 1.254 train_accuracy: 0.574 test_accuracy: 0.515\n",
            "[5,   940] train_loss: 1.612 train_accuracy: 0.584 test_accuracy: 0.516\n",
            "[5,   945] train_loss: 1.219 train_accuracy: 0.580 test_accuracy: 0.510\n",
            "[5,   950] train_loss: 1.483 train_accuracy: 0.558 test_accuracy: 0.497\n",
            "[5,   955] train_loss: 1.417 train_accuracy: 0.552 test_accuracy: 0.499\n",
            "[5,   960] train_loss: 1.208 train_accuracy: 0.550 test_accuracy: 0.497\n",
            "[5,   965] train_loss: 1.260 train_accuracy: 0.553 test_accuracy: 0.499\n",
            "[5,   970] train_loss: 1.343 train_accuracy: 0.554 test_accuracy: 0.498\n",
            "[5,   975] train_loss: 1.248 train_accuracy: 0.570 test_accuracy: 0.507\n",
            "[5,   980] train_loss: 1.348 train_accuracy: 0.575 test_accuracy: 0.507\n",
            "[5,   985] train_loss: 1.387 train_accuracy: 0.559 test_accuracy: 0.493\n",
            "[5,   990] train_loss: 1.361 train_accuracy: 0.557 test_accuracy: 0.493\n",
            "[5,   995] train_loss: 1.273 train_accuracy: 0.572 test_accuracy: 0.509\n",
            "[5,  1000] train_loss: 1.238 train_accuracy: 0.564 test_accuracy: 0.507\n",
            "[5,  1005] train_loss: 1.475 train_accuracy: 0.570 test_accuracy: 0.512\n",
            "[5,  1010] train_loss: 1.304 train_accuracy: 0.567 test_accuracy: 0.507\n",
            "[5,  1015] train_loss: 1.205 train_accuracy: 0.564 test_accuracy: 0.499\n",
            "[5,  1020] train_loss: 1.238 train_accuracy: 0.574 test_accuracy: 0.506\n",
            "[5,  1025] train_loss: 1.190 train_accuracy: 0.560 test_accuracy: 0.503\n",
            "[5,  1030] train_loss: 1.381 train_accuracy: 0.562 test_accuracy: 0.501\n",
            "[5,  1035] train_loss: 1.299 train_accuracy: 0.551 test_accuracy: 0.495\n",
            "[5,  1040] train_loss: 1.383 train_accuracy: 0.567 test_accuracy: 0.506\n",
            "[5,  1045] train_loss: 1.288 train_accuracy: 0.567 test_accuracy: 0.506\n",
            "[5,  1050] train_loss: 1.233 train_accuracy: 0.557 test_accuracy: 0.502\n",
            "[5,  1055] train_loss: 1.325 train_accuracy: 0.565 test_accuracy: 0.504\n",
            "[5,  1060] train_loss: 1.227 train_accuracy: 0.573 test_accuracy: 0.507\n",
            "[5,  1065] train_loss: 1.219 train_accuracy: 0.570 test_accuracy: 0.503\n",
            "[5,  1070] train_loss: 1.296 train_accuracy: 0.556 test_accuracy: 0.496\n",
            "[5,  1075] train_loss: 1.447 train_accuracy: 0.568 test_accuracy: 0.505\n",
            "[5,  1080] train_loss: 1.388 train_accuracy: 0.568 test_accuracy: 0.511\n",
            "[5,  1085] train_loss: 1.269 train_accuracy: 0.555 test_accuracy: 0.495\n",
            "[5,  1090] train_loss: 1.378 train_accuracy: 0.562 test_accuracy: 0.501\n",
            "[5,  1095] train_loss: 1.321 train_accuracy: 0.569 test_accuracy: 0.506\n",
            "[5,  1100] train_loss: 1.353 train_accuracy: 0.565 test_accuracy: 0.501\n",
            "[5,  1105] train_loss: 1.167 train_accuracy: 0.575 test_accuracy: 0.508\n",
            "[5,  1110] train_loss: 1.342 train_accuracy: 0.570 test_accuracy: 0.512\n",
            "[5,  1115] train_loss: 1.257 train_accuracy: 0.581 test_accuracy: 0.511\n",
            "[5,  1120] train_loss: 1.328 train_accuracy: 0.580 test_accuracy: 0.512\n",
            "[5,  1125] train_loss: 1.280 train_accuracy: 0.582 test_accuracy: 0.513\n",
            "[5,  1130] train_loss: 1.348 train_accuracy: 0.588 test_accuracy: 0.508\n",
            "[5,  1135] train_loss: 1.309 train_accuracy: 0.585 test_accuracy: 0.508\n",
            "[5,  1140] train_loss: 1.294 train_accuracy: 0.575 test_accuracy: 0.503\n",
            "[5,  1145] train_loss: 1.380 train_accuracy: 0.574 test_accuracy: 0.503\n",
            "[5,  1150] train_loss: 1.320 train_accuracy: 0.568 test_accuracy: 0.499\n",
            "[5,  1155] train_loss: 1.311 train_accuracy: 0.574 test_accuracy: 0.508\n",
            "[5,  1160] train_loss: 1.432 train_accuracy: 0.576 test_accuracy: 0.509\n",
            "[5,  1165] train_loss: 1.408 train_accuracy: 0.576 test_accuracy: 0.506\n",
            "[5,  1170] train_loss: 1.353 train_accuracy: 0.573 test_accuracy: 0.503\n",
            "[5,  1175] train_loss: 1.348 train_accuracy: 0.579 test_accuracy: 0.508\n",
            "[5,  1180] train_loss: 1.205 train_accuracy: 0.579 test_accuracy: 0.506\n",
            "[5,  1185] train_loss: 1.149 train_accuracy: 0.580 test_accuracy: 0.508\n",
            "[5,  1190] train_loss: 1.327 train_accuracy: 0.574 test_accuracy: 0.509\n",
            "[5,  1195] train_loss: 1.352 train_accuracy: 0.573 test_accuracy: 0.506\n",
            "[5,  1200] train_loss: 1.356 train_accuracy: 0.575 test_accuracy: 0.504\n",
            "[5,  1205] train_loss: 1.167 train_accuracy: 0.584 test_accuracy: 0.513\n",
            "[5,  1210] train_loss: 1.300 train_accuracy: 0.576 test_accuracy: 0.508\n",
            "[5,  1215] train_loss: 1.323 train_accuracy: 0.572 test_accuracy: 0.503\n",
            "[5,  1220] train_loss: 1.165 train_accuracy: 0.573 test_accuracy: 0.501\n",
            "[5,  1225] train_loss: 1.109 train_accuracy: 0.585 test_accuracy: 0.514\n",
            "[5,  1230] train_loss: 1.353 train_accuracy: 0.587 test_accuracy: 0.516\n",
            "[5,  1235] train_loss: 1.367 train_accuracy: 0.583 test_accuracy: 0.512\n",
            "[5,  1240] train_loss: 1.196 train_accuracy: 0.568 test_accuracy: 0.501\n",
            "[5,  1245] train_loss: 1.298 train_accuracy: 0.570 test_accuracy: 0.501\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "# Writing training accuracy to file\n",
        "with open('Accuracy_a_train.txt', 'w') as file:\n",
        "    for i in range(len(a_train)):\n",
        "        file.write(str(a_train[i]))\n",
        "        if i < len(a_train) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing test accuracy to file\n",
        "with open('Accuracy_a_test.txt', 'w') as file:\n",
        "    for i in range(len(a_test)):\n",
        "        file.write(str(a_test[i]))\n",
        "        if i < len(a_test) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing loss values to file\n",
        "with open('Accuracy_loss.txt', 'w') as file:\n",
        "    for i in range(len(lossaaa)):\n",
        "        file.write(str(lossaaa[i]))\n",
        "        if i < len(lossaaa) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "B4mbvMwlFOMx"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Convert tensors to lists\n",
        "Inf_list = [tensor.item() for tensor in Inf]\n",
        "Var_av_list = [tensor.item() for tensor in Var_all]\n",
        "Generalization_Ratio_list = [tensor.item() for tensor in Generalization_Ratio_]\n",
        "\n",
        "# Writing Inf_list to file\n",
        "with open('Inf_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Inf_list)):\n",
        "        file.write(str(Inf_list[i]))\n",
        "        if i < len(Inf_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Var_av_list to file\n",
        "with open('Var_all_OOD.txt', 'w') as file:\n",
        "    for i in range(len(Var_av_list)):\n",
        "        file.write(str(Var_av_list[i]))\n",
        "        if i < len(Var_av_list) - 1:\n",
        "            file.write(', ')\n",
        "\n",
        "# Writing Generalization_Ratio_list to file\n",
        "with open('Generalization_Ratio_list.txt', 'w') as file:\n",
        "    for i in range(len(Generalization_Ratio_list)):\n",
        "        file.write(str(Generalization_Ratio_list[i]))\n",
        "        if i < len(Generalization_Ratio_list) - 1:\n",
        "            file.write(', ')"
      ],
      "metadata": {
        "id": "g282Q2I1ENff"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "import time\n",
        "import os  # Import the os module\n",
        "\n",
        "os.makedirs(os.path.join('./Models/'), exist_ok=True)  # Create the directory './Models/' if it doesn't exist\n",
        "model_path = './Models/'  # Define the model path\n",
        "\n",
        "rq = time.strftime('%Y%m%d%H%M', time.localtime(time.time()))  # Get the current time in the format 'YYYYMMDDHHMM'\n",
        "\n",
        "# Save the training results\n",
        "current_model_path = model_path + rq + \"_model.pkl\"  # Create the full path for the model file with the current timestamp\n",
        "torch.save(net, current_model_path)  # Save the model to the specified path\n",
        "print(\"Saved model file: \" + current_model_path)  # Print the path of the saved model file"
      ],
      "metadata": {
        "id": "Z51pkCEvFe6t"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# Display the highest value that appears during training\n",
        "print(\"train:\", max(a_train))  # Print the highest value in the training data\n",
        "print(\"test:\", max(a_test))  # Print the highest value in the test data\n",
        "print(\"loss:\", min(lossaaa))  # Print the minimum value of the loss"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "k1RU0d7-FvJp",
        "outputId": "3f6ae37a-2aa0-46b1-9506-9e711d753a6a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "train: 0.5879\n",
            "test: 0.5198\n",
            "loss: 1.0879650712013245\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "trainset = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)  # Load CIFAR-10 training dataset\n",
        "testset = torchvision.datasets.CIFAR10(root='./data', train=False, download=False, transform=transform)  # Load CIFAR-10 test dataset\n",
        "trainloader = torch.utils.data.DataLoader(trainset, batch_size=50000, shuffle=True, num_workers=0)  # Create DataLoader for training set\n",
        "t_loader = torch.utils.data.DataLoader(testset, batch_size=10000, shuffle=False, num_workers=0)  # Create DataLoader for test set\n",
        "\n",
        "trainloader_iter = iter(trainloader)  # Create an iterator for the training DataLoader\n",
        "tl_image, tl_label = next(trainloader_iter)  # Get the next batch of images and labels from the training DataLoader\n",
        "tl_image = tl_image.cuda()  # Move training images to GPU\n",
        "tl_label = tl_label.cuda()  # Move training labels to GPU\n",
        "tl_imageoutputs = net(tl_image)  # [batch, 10]  # Get the outputs from the network for the training images\n",
        "predict_y = torch.max(tl_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy = torch.eq(predict_y, tl_label).sum().item() / tl_label.size(0)  # Calculate accuracy for the training set\n",
        "print(\"train:\", float(accuracy))  # Print the training accuracy\n",
        "\n",
        "t_data_iter = iter(t_loader)  # Create an iterator for the test DataLoader\n",
        "t_image, t_label = next(t_data_iter)  # Get the next batch of images and labels from the test DataLoader\n",
        "t_image = t_image.cuda()  # Move test images to GPU\n",
        "t_label = t_label.cuda()  # Move test labels to GPU\n",
        "t_imageoutputs = net(t_image)  # [batch, 10]  # Get the outputs from the network for the test images\n",
        "predict = torch.max(t_imageoutputs, dim=1)[1]  # Get the predicted labels by finding the max output along dimension 1\n",
        "accuracy_t = torch.eq(predict, t_label).sum().item() / t_label.size(0)  # Calculate accuracy for the test set\n",
        "print(\"test:\", float(accuracy_t))  # Print the test accuracy"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "o4YNgqE0Fyu8",
        "outputId": "0e87802a-fef7-47cd-94f9-b8ed90aa7932"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n",
            "train: 0.56694\n",
            "test: 0.501\n"
          ]
        }
      ]
    }
  ]
}