{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "e63da0ce",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import os\n",
    "import pandas as pd\n",
    "import torch\n",
    "from torch import Tensor\n",
    "from typing import Tuple, List, Callable\n",
    "import random\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "\n",
    "import pdb\n",
    "import time\n",
    "\n",
    "torch.cuda.is_available()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "054927e8",
   "metadata": {},
   "outputs": [],
   "source": [
    "gpu_ids = [5]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "4e23f288",
   "metadata": {},
   "outputs": [],
   "source": [
    "from run import *\n",
    "from utils import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "40fe2848",
   "metadata": {},
   "outputs": [],
   "source": [
    "### TIME_LIMITS and LRs are for simulatiom arguments \n",
    "TIME_LIMITS = {'mnist': 500, 'fashion mnist': 2000  , 'cifar 10': 100000, 'celeba': 1000, 'tinyimagenet': 10000}\n",
    "LRs         = {'mnist': 0.5, 'fashion mnist': 0.0001, 'cifar 10': 0.005, 'celeba': 0.01, 'tinyimagenet': 0.1}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "f91594d2",
   "metadata": {},
   "outputs": [],
   "source": [
    "#dataset_name = 'tinyimagenet'\n",
    "#dataset_name = 'mnist'\n",
    "dataset_name = 'cifar 10'\n",
    "lr = LRs[dataset_name]\n",
    "time_limit = TIME_LIMITS[dataset_name]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "a73d260c",
   "metadata": {},
   "outputs": [],
   "source": [
    "### Here you should define different setups that you want to run and compare.\n",
    "### Each config should be added to the \"setups\" dictionary. Config arguments are difined \n",
    "### by a dictionary from argument_name to value. \n",
    "\n",
    "setups = {}\n",
    "rep=0\n",
    "\n",
    "group_count = 20\n",
    "client_count = 100\n",
    "max_local_steps = 20\n",
    "\n",
    "server_interaction_time = 3\n",
    "server_waiting_time = 4\n",
    "## Fed-Avg config example\n",
    "method = \"identity\"\n",
    "quantizer = {\"method\": method}\n",
    "local_steps = max_local_steps\n",
    "\n",
    "\n",
    "\n",
    "setups[\"FedAvg\"] = {'algorithm': \"Fed_Avg\", \n",
    "                                                                                         'client count': client_count,\n",
    "                                                                                         'local step': local_steps,\n",
    "                                                                                         'group count': group_count,\n",
    "                                                                                         'quantizer': quantizer, \n",
    "                                                                                         'time_limit': time_limit,\n",
    "                                                                                         'lr': lr,\n",
    "                                                                                         'sit': server_interaction_time,\n",
    "                                                                                         'gpu_ids': gpu_ids}\n",
    "\n",
    "setups[\"FedBuff\"] = {'algorithm': \"Fed_Buff\", \n",
    "                                                                                         'client count': client_count,\n",
    "                                                                                         'local step': local_steps,\n",
    "                                                                                         'group count': group_count,\n",
    "                                                                                         'quantizer': quantizer, \n",
    "                                                                                         'time_limit': time_limit,\n",
    "                                                                                         'lr': lr,\n",
    "                                                                                         'sit': server_interaction_time,\n",
    "                                                                                         'gpu_ids': gpu_ids}\n",
    "setups[\"QuAFL\"] = {'algorithm': \"quantized_fl\", \n",
    "                                                                                          'client count': client_count,\n",
    "                                                                                          'local step': max_local_steps,\n",
    "                                                                                          'group count': group_count,\n",
    "                                                                                          'quantizer': quantizer, \n",
    "                                                                                          'time_limit': time_limit,\n",
    "                                                                                          'lr': lr,\n",
    "                                                                                          'swt': server_waiting_time,\n",
    "                                                                                          'sit': server_interaction_time,\n",
    "                                                                                          'gpu_ids': gpu_ids,\n",
    "                                                                                          'client_averaging': True,\n",
    "                                                                                          'server_averaging': True,}\n",
    "\n",
    "setups[\"FAVAS\"] = {'algorithm': \"FLASQ_reweight_avg\", \n",
    "                                                                                          'client count': client_count,\n",
    "                                                                                          'local step': max_local_steps,\n",
    "                                                                                          'group count': group_count,\n",
    "                                                                                          'quantizer': quantizer, \n",
    "                                                                                          'time_limit': time_limit,\n",
    "                                                                                          'lr': lr,\n",
    "                                                                                          'swt': server_waiting_time,\n",
    "                                                                                          'sit': server_interaction_time,\n",
    "                                                                                          'gpu_ids': gpu_ids,\n",
    "                                                                                          'client_averaging': False,\n",
    "                                                                                          'server_averaging': True,}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "91408e6d",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading cifar_10_hetero_qnn dataset.\n",
      "/data/louis/cifar10/\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "--- FedAvg ---\n",
      "ResNetCifar(\n",
      "  (conv1): Conv2d_LUQ(3, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "  (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "  (relu): ReLU(inplace=True)\n",
      "  (layer1): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (layer2): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "      (downsample): Sequential(\n",
      "        (0): Conv2d_LUQ(16, 32, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "        (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      )\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (layer3): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 64, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "      (downsample): Sequential(\n",
      "        (0): Conv2d_LUQ(32, 64, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "        (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      )\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (avgpool): AvgPool2d(kernel_size=8, stride=1, padding=0)\n",
      "  (fc): Linear(in_features=64, out_features=10, bias=True)\n",
      ")\n",
      "Client 1 is added to the population.\n",
      "Client 2 is added to the population.\n",
      "Client 3 is added to the population.\n",
      "Client 4 is added to the population.\n",
      "Client 5 is added to the population.\n",
      "Client 6 is added to the population.\n",
      "Client 7 is added to the population.\n",
      "Client 8 is added to the population.\n",
      "Client 9 is added to the population.\n",
      "Client 10 is added to the population.\n",
      "Client 11 is added to the population.\n",
      "Client 12 is added to the population.\n",
      "Client 13 is added to the population.\n",
      "Client 14 is added to the population.\n",
      "Client 15 is added to the population.\n",
      "Client 16 is added to the population.\n",
      "Client 17 is added to the population.\n",
      "Client 18 is added to the population.\n",
      "Client 19 is added to the population.\n",
      "Client 20 is added to the population.\n",
      "Client 21 is added to the population.\n",
      "Client 22 is added to the population.\n",
      "Client 23 is added to the population.\n",
      "Client 24 is added to the population.\n",
      "Client 25 is added to the population.\n",
      "Client 26 is added to the population.\n",
      "Client 27 is added to the population.\n",
      "Client 28 is added to the population.\n",
      "Client 29 is added to the population.\n",
      "Client 30 is added to the population.\n",
      "Client 31 is added to the population.\n",
      "Client 32 is added to the population.\n",
      "Client 33 is added to the population.\n",
      "Client 34 is added to the population.\n",
      "Client 35 is added to the population.\n",
      "Client 36 is added to the population.\n",
      "Client 37 is added to the population.\n",
      "Client 38 is added to the population.\n",
      "Client 39 is added to the population.\n",
      "Client 40 is added to the population.\n",
      "Client 41 is added to the population.\n",
      "Client 42 is added to the population.\n",
      "Client 43 is added to the population.\n",
      "Client 44 is added to the population.\n",
      "Client 45 is added to the population.\n",
      "Client 46 is added to the population.\n",
      "Client 47 is added to the population.\n",
      "Client 48 is added to the population.\n",
      "Client 49 is added to the population.\n",
      "Client 50 is added to the population.\n",
      "Client 51 is added to the population.\n",
      "Client 52 is added to the population.\n",
      "Client 53 is added to the population.\n",
      "Client 54 is added to the population.\n",
      "Client 55 is added to the population.\n",
      "Client 56 is added to the population.\n",
      "Client 57 is added to the population.\n",
      "Client 58 is added to the population.\n",
      "Client 59 is added to the population.\n",
      "Client 60 is added to the population.\n",
      "Client 61 is added to the population.\n",
      "Client 62 is added to the population.\n",
      "Client 63 is added to the population.\n",
      "Client 64 is added to the population.\n",
      "Client 65 is added to the population.\n",
      "Client 66 is added to the population.\n",
      "Client 67 is added to the population.\n",
      "Client 68 is added to the population.\n",
      "Client 69 is added to the population.\n",
      "Client 70 is added to the population.\n",
      "Client 71 is added to the population.\n",
      "Client 72 is added to the population.\n",
      "Client 73 is added to the population.\n",
      "Client 74 is added to the population.\n",
      "Client 75 is added to the population.\n",
      "Client 76 is added to the population.\n",
      "Client 77 is added to the population.\n",
      "Client 78 is added to the population.\n",
      "Client 79 is added to the population.\n",
      "Client 80 is added to the population.\n",
      "Client 81 is added to the population.\n",
      "Client 82 is added to the population.\n",
      "Client 83 is added to the population.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Client 84 is added to the population.\n",
      "Client 85 is added to the population.\n",
      "Client 86 is added to the population.\n",
      "Client 87 is added to the population.\n",
      "Client 88 is added to the population.\n",
      "Client 89 is added to the population.\n",
      "Client 90 is added to the population.\n",
      "Client 91 is added to the population.\n",
      "Client 92 is added to the population.\n",
      "Client 93 is added to the population.\n",
      "Client 94 is added to the population.\n",
      "Client 95 is added to the population.\n",
      "Client 96 is added to the population.\n",
      "Client 97 is added to the population.\n",
      "Client 98 is added to the population.\n",
      "Client 99 is added to the population.\n",
      "Client 100 is added to the population.\n",
      "0.0\n",
      "Train: Step:     0 Val-Loss: 2.8170  Val-Acc: 0.10 Time:   0.00 Local Steps:     0\n",
      "16.599344\n",
      "Train: Step:     1 Val-Loss: 2.3509  Val-Acc: 0.07 Time: 357.14 Local Steps:   400\n",
      "26.474083\n",
      "Train: Step:     2 Val-Loss: 2.3365  Val-Acc: 0.10 Time: 794.46 Local Steps:   800\n",
      "28.71138\n",
      "Train: Step:     3 Val-Loss: 2.3254  Val-Acc: 0.11 Time: 1216.41 Local Steps:  1200\n",
      "31.287514\n",
      "Train: Step:     4 Val-Loss: 2.3452  Val-Acc: 0.11 Time: 1634.17 Local Steps:  1600\n",
      "34.15632\n",
      "Train: Step:     5 Val-Loss: 2.3405  Val-Acc: 0.12 Time: 2028.60 Local Steps:  2000\n",
      "34.32169\n",
      "Train: Step:     6 Val-Loss: 2.3296  Val-Acc: 0.11 Time: 2519.66 Local Steps:  2400\n",
      "36.845715\n",
      "Train: Step:     7 Val-Loss: 2.3541  Val-Acc: 0.10 Time: 2945.43 Local Steps:  2800\n",
      "36.810234\n",
      "Train: Step:     8 Val-Loss: 2.3513  Val-Acc: 0.11 Time: 3321.71 Local Steps:  3200\n",
      "36.0167\n",
      "Train: Step:     9 Val-Loss: 2.3152  Val-Acc: 0.12 Time: 3740.97 Local Steps:  3600\n",
      "36.09433\n",
      "Train: Step:    10 Val-Loss: 2.3099  Val-Acc: 0.13 Time: 4170.42 Local Steps:  4000\n",
      "36.83458\n",
      "Train: Step:    11 Val-Loss: 2.3283  Val-Acc: 0.16 Time: 4574.37 Local Steps:  4400\n",
      "36.77033\n",
      "Train: Step:    12 Val-Loss: 2.3234  Val-Acc: 0.15 Time: 4931.33 Local Steps:  4800\n",
      "37.029564\n",
      "Train: Step:    13 Val-Loss: 2.2952  Val-Acc: 0.15 Time: 5353.55 Local Steps:  5200\n",
      "37.559296\n",
      "Train: Step:    14 Val-Loss: 2.2796  Val-Acc: 0.14 Time: 5708.58 Local Steps:  5600\n",
      "37.255592\n",
      "Train: Step:    15 Val-Loss: 2.2724  Val-Acc: 0.15 Time: 6159.03 Local Steps:  6000\n",
      "37.7659\n",
      "Train: Step:    16 Val-Loss: 2.2699  Val-Acc: 0.16 Time: 6575.09 Local Steps:  6400\n",
      "38.421837\n",
      "Train: Step:    17 Val-Loss: 2.2847  Val-Acc: 0.13 Time: 6972.08 Local Steps:  6800\n",
      "37.771355\n",
      "Train: Step:    18 Val-Loss: 2.2588  Val-Acc: 0.15 Time: 7402.59 Local Steps:  7200\n",
      "37.848816\n",
      "Train: Step:    19 Val-Loss: 2.2576  Val-Acc: 0.18 Time: 7759.08 Local Steps:  7600\n",
      "37.916138\n",
      "Train: Step:    20 Val-Loss: 2.2519  Val-Acc: 0.19 Time: 8129.54 Local Steps:  8000\n",
      "38.579216\n",
      "Train: Step:    21 Val-Loss: 2.2932  Val-Acc: 0.17 Time: 8533.49 Local Steps:  8400\n",
      "38.280327\n",
      "Train: Step:    22 Val-Loss: 2.2612  Val-Acc: 0.19 Time: 8877.95 Local Steps:  8800\n",
      "38.62787\n",
      "Train: Step:    23 Val-Loss: 2.2390  Val-Acc: 0.16 Time: 9233.48 Local Steps:  9200\n",
      "39.84896\n",
      "Train: Step:    24 Val-Loss: 2.2433  Val-Acc: 0.17 Time: 9624.49 Local Steps:  9600\n",
      "39.314613\n",
      "Train: Step:    25 Val-Loss: 2.2624  Val-Acc: 0.14 Time: 10136.78 Local Steps: 10000\n",
      "38.72184\n",
      "Train: Step:    26 Val-Loss: 2.2397  Val-Acc: 0.14 Time: 10592.07 Local Steps: 10400\n",
      "38.77887\n",
      "Train: Step:    29 Val-Loss: 2.1808  Val-Acc: 0.21 Time: 11769.03 Local Steps: 11600\n",
      "39.301758\n",
      "Train: Step:    30 Val-Loss: 2.1772  Val-Acc: 0.20 Time: 12290.26 Local Steps: 12000\n",
      "38.6615\n",
      "Train: Step:    31 Val-Loss: 2.1503  Val-Acc: 0.21 Time: 12801.60 Local Steps: 12400\n",
      "39.545883\n",
      "Train: Step:    32 Val-Loss: 2.1586  Val-Acc: 0.19 Time: 13168.12 Local Steps: 12800\n",
      "38.93248\n",
      "Train: Step:    33 Val-Loss: 2.1322  Val-Acc: 0.21 Time: 13512.49 Local Steps: 13200\n",
      "39.35407\n",
      "Train: Step:    34 Val-Loss: 2.1219  Val-Acc: 0.23 Time: 13883.91 Local Steps: 13600\n",
      "39.280457\n",
      "Train: Step:    35 Val-Loss: 2.1261  Val-Acc: 0.21 Time: 14274.54 Local Steps: 14000\n",
      "40.06376\n",
      "Train: Step:    36 Val-Loss: 2.1300  Val-Acc: 0.21 Time: 14612.99 Local Steps: 14400\n",
      "39.121857\n",
      "Train: Step:    37 Val-Loss: 2.1189  Val-Acc: 0.22 Time: 14970.73 Local Steps: 14800\n",
      "39.072815\n",
      "Train: Step:    38 Val-Loss: 2.1041  Val-Acc: 0.21 Time: 15446.32 Local Steps: 15200\n",
      "39.02048\n",
      "Train: Step:    39 Val-Loss: 2.1184  Val-Acc: 0.21 Time: 15856.85 Local Steps: 15600\n",
      "39.342712\n",
      "Train: Step:    40 Val-Loss: 2.1072  Val-Acc: 0.22 Time: 16278.13 Local Steps: 16000\n",
      "39.820328\n",
      "Train: Step:    41 Val-Loss: 2.1791  Val-Acc: 0.19 Time: 16711.56 Local Steps: 16400\n",
      "40.331837\n",
      "Train: Step:    42 Val-Loss: 2.2124  Val-Acc: 0.15 Time: 17141.58 Local Steps: 16800\n",
      "39.01625\n",
      "Train: Step:    43 Val-Loss: 2.1275  Val-Acc: 0.20 Time: 17610.73 Local Steps: 17200\n",
      "38.99269\n",
      "Train: Step:    44 Val-Loss: 2.1276  Val-Acc: 0.21 Time: 17995.86 Local Steps: 17600\n",
      "39.57177\n",
      "Train: Step:    45 Val-Loss: 2.1270  Val-Acc: 0.21 Time: 18413.22 Local Steps: 18000\n",
      "40.107853\n",
      "Train: Step:    46 Val-Loss: 2.1545  Val-Acc: 0.21 Time: 18900.37 Local Steps: 18400\n",
      "39.26777\n",
      "Train: Step:    47 Val-Loss: 2.1113  Val-Acc: 0.22 Time: 19343.69 Local Steps: 18800\n",
      "38.405495\n",
      "Train: Step:    48 Val-Loss: 2.0672  Val-Acc: 0.23 Time: 19753.17 Local Steps: 19200\n",
      "38.980103\n",
      "Train: Step:    49 Val-Loss: 2.0787  Val-Acc: 0.21 Time: 20148.68 Local Steps: 19600\n",
      "39.58344\n",
      "Train: Step:    50 Val-Loss: 2.0605  Val-Acc: 0.22 Time: 20533.01 Local Steps: 20000\n",
      "38.928585\n",
      "Train: Step:    51 Val-Loss: 2.0831  Val-Acc: 0.20 Time: 20939.91 Local Steps: 20400\n",
      "39.344723\n",
      "Train: Step:    52 Val-Loss: 2.1133  Val-Acc: 0.18 Time: 21326.00 Local Steps: 20800\n",
      "39.032707\n",
      "Train: Step:    53 Val-Loss: 2.0904  Val-Acc: 0.22 Time: 21712.76 Local Steps: 21200\n",
      "39.206207\n",
      "Train: Step:    54 Val-Loss: 2.0852  Val-Acc: 0.22 Time: 22128.59 Local Steps: 21600\n",
      "39.424706\n",
      "Train: Step:    55 Val-Loss: 2.0991  Val-Acc: 0.20 Time: 22550.24 Local Steps: 22000\n",
      "39.07972\n",
      "Train: Step:    56 Val-Loss: 2.1032  Val-Acc: 0.20 Time: 22957.08 Local Steps: 22400\n",
      "38.93505\n",
      "Train: Step:    57 Val-Loss: 2.0903  Val-Acc: 0.20 Time: 23365.12 Local Steps: 22800\n",
      "38.157066\n",
      "Train: Step:    58 Val-Loss: 2.0648  Val-Acc: 0.22 Time: 23862.08 Local Steps: 23200\n",
      "38.943237\n",
      "Train: Step:    59 Val-Loss: 2.0706  Val-Acc: 0.20 Time: 24248.87 Local Steps: 23600\n",
      "38.23831\n",
      "Train: Step:    60 Val-Loss: 2.0341  Val-Acc: 0.24 Time: 24719.58 Local Steps: 24000\n",
      "38.742867\n",
      "Train: Step:    61 Val-Loss: 2.0315  Val-Acc: 0.23 Time: 25108.02 Local Steps: 24400\n",
      "37.924137\n",
      "Train: Step:    62 Val-Loss: 2.0664  Val-Acc: 0.23 Time: 25541.46 Local Steps: 24800\n",
      "38.525276\n",
      "Train: Step:    63 Val-Loss: 2.0733  Val-Acc: 0.20 Time: 25961.59 Local Steps: 25200\n",
      "38.71523\n",
      "Train: Step:    64 Val-Loss: 2.0654  Val-Acc: 0.21 Time: 26463.85 Local Steps: 25600\n",
      "38.734264\n",
      "Train: Step:    65 Val-Loss: 2.0843  Val-Acc: 0.22 Time: 26824.14 Local Steps: 26000\n",
      "38.281425\n",
      "Train: Step:    66 Val-Loss: 2.0648  Val-Acc: 0.23 Time: 27264.29 Local Steps: 26400\n",
      "38.67792\n",
      "Train: Step:    67 Val-Loss: 2.0915  Val-Acc: 0.22 Time: 27705.48 Local Steps: 26800\n",
      "39.018677\n",
      "Train: Step:    68 Val-Loss: 2.1520  Val-Acc: 0.18 Time: 28131.23 Local Steps: 27200\n",
      "37.95972\n",
      "Train: Step:    69 Val-Loss: 2.0636  Val-Acc: 0.23 Time: 28605.86 Local Steps: 27600\n",
      "38.49373\n",
      "Train: Step:    70 Val-Loss: 2.0877  Val-Acc: 0.22 Time: 28948.79 Local Steps: 28000\n",
      "38.135353\n",
      "Train: Step:    71 Val-Loss: 2.0797  Val-Acc: 0.24 Time: 29277.53 Local Steps: 28400\n",
      "38.30313\n",
      "Train: Step:    72 Val-Loss: 2.0260  Val-Acc: 0.24 Time: 29637.41 Local Steps: 28800\n",
      "38.006065\n",
      "Train: Step:    73 Val-Loss: 2.0690  Val-Acc: 0.22 Time: 30147.64 Local Steps: 29200\n",
      "38.11696\n",
      "Train: Step:    74 Val-Loss: 2.0642  Val-Acc: 0.25 Time: 30609.02 Local Steps: 29600\n",
      "38.340797\n",
      "Train: Step:    75 Val-Loss: 2.0668  Val-Acc: 0.23 Time: 31006.05 Local Steps: 30000\n",
      "37.89698\n",
      "Train: Step:    76 Val-Loss: 2.0532  Val-Acc: 0.23 Time: 31338.66 Local Steps: 30400\n",
      "37.758324\n",
      "Train: Step:    77 Val-Loss: 2.0311  Val-Acc: 0.23 Time: 31674.32 Local Steps: 30800\n",
      "38.24181\n",
      "Train: Step:    78 Val-Loss: 2.0035  Val-Acc: 0.24 Time: 32057.51 Local Steps: 31200\n",
      "38.56048\n",
      "Train: Step:    79 Val-Loss: 2.0530  Val-Acc: 0.23 Time: 32426.05 Local Steps: 31600\n",
      "38.801376\n",
      "Train: Step:    80 Val-Loss: 2.0499  Val-Acc: 0.24 Time: 32835.90 Local Steps: 32000\n",
      "38.47892\n",
      "Train: Step:    81 Val-Loss: 2.0567  Val-Acc: 0.24 Time: 33197.34 Local Steps: 32400\n",
      "38.326447\n",
      "Train: Step:    82 Val-Loss: 2.0575  Val-Acc: 0.23 Time: 33640.59 Local Steps: 32800\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "38.611076\n",
      "Train: Step:    83 Val-Loss: 2.0824  Val-Acc: 0.21 Time: 33998.57 Local Steps: 33200\n",
      "38.772392\n",
      "Train: Step:    84 Val-Loss: 2.0704  Val-Acc: 0.21 Time: 34472.17 Local Steps: 33600\n",
      "38.472717\n",
      "Train: Step:    85 Val-Loss: 2.0597  Val-Acc: 0.22 Time: 34818.69 Local Steps: 34000\n",
      "38.294933\n",
      "Train: Step:    86 Val-Loss: 2.0312  Val-Acc: 0.25 Time: 35199.66 Local Steps: 34400\n",
      "38.29233\n",
      "Train: Step:    87 Val-Loss: 2.0425  Val-Acc: 0.25 Time: 35716.74 Local Steps: 34800\n",
      "38.157967\n",
      "Train: Step:    88 Val-Loss: 2.0304  Val-Acc: 0.24 Time: 36162.83 Local Steps: 35200\n",
      "38.53066\n",
      "Train: Step:    89 Val-Loss: 2.0042  Val-Acc: 0.26 Time: 36581.63 Local Steps: 35600\n",
      "37.949287\n",
      "Train: Step:    90 Val-Loss: 2.0044  Val-Acc: 0.26 Time: 36965.08 Local Steps: 36000\n",
      "37.6323\n",
      "Train: Step:    91 Val-Loss: 1.9845  Val-Acc: 0.27 Time: 37418.46 Local Steps: 36400\n",
      "37.57313\n",
      "Train: Step:    92 Val-Loss: 1.9841  Val-Acc: 0.24 Time: 37896.65 Local Steps: 36800\n",
      "37.561047\n",
      "Train: Step:    93 Val-Loss: 2.0006  Val-Acc: 0.26 Time: 38353.54 Local Steps: 37200\n",
      "37.365604\n",
      "Train: Step:    94 Val-Loss: 1.9798  Val-Acc: 0.24 Time: 38734.34 Local Steps: 37600\n",
      "37.852325\n",
      "Train: Step:    95 Val-Loss: 1.9800  Val-Acc: 0.26 Time: 39108.68 Local Steps: 38000\n",
      "37.4809\n",
      "Train: Step:    96 Val-Loss: 1.9662  Val-Acc: 0.26 Time: 39590.26 Local Steps: 38400\n",
      "37.44032\n",
      "Train: Step:    97 Val-Loss: 2.0041  Val-Acc: 0.24 Time: 40086.21 Local Steps: 38800\n",
      "37.624832\n",
      "Train: Step:    98 Val-Loss: 2.0014  Val-Acc: 0.25 Time: 40545.76 Local Steps: 39200\n",
      "37.757637\n",
      "Train: Step:    99 Val-Loss: 1.9843  Val-Acc: 0.24 Time: 40923.49 Local Steps: 39600\n",
      "37.537163\n",
      "Train: Step:   100 Val-Loss: 1.9855  Val-Acc: 0.25 Time: 41382.03 Local Steps: 40000\n",
      "37.51159\n",
      "Train: Step:   101 Val-Loss: 1.9808  Val-Acc: 0.23 Time: 41808.76 Local Steps: 40400\n",
      "37.480034\n",
      "Train: Step:   102 Val-Loss: 1.9749  Val-Acc: 0.25 Time: 42179.95 Local Steps: 40800\n",
      "36.91172\n",
      "Train: Step:   103 Val-Loss: 1.9924  Val-Acc: 0.26 Time: 42702.01 Local Steps: 41200\n",
      "37.528503\n",
      "Train: Step:   104 Val-Loss: 1.9863  Val-Acc: 0.23 Time: 43149.67 Local Steps: 41600\n",
      "36.97396\n",
      "Train: Step:   105 Val-Loss: 1.9839  Val-Acc: 0.25 Time: 43657.46 Local Steps: 42000\n",
      "37.11824\n",
      "Train: Step:   106 Val-Loss: 1.9829  Val-Acc: 0.26 Time: 44077.27 Local Steps: 42400\n",
      "36.982227\n",
      "Train: Step:   107 Val-Loss: 1.9850  Val-Acc: 0.26 Time: 44512.37 Local Steps: 42800\n",
      "37.329353\n",
      "Train: Step:   108 Val-Loss: 1.9824  Val-Acc: 0.25 Time: 44958.51 Local Steps: 43200\n",
      "37.273483\n",
      "Train: Step:   109 Val-Loss: 1.9991  Val-Acc: 0.23 Time: 45373.97 Local Steps: 43600\n",
      "37.355167\n",
      "Train: Step:   110 Val-Loss: 1.9997  Val-Acc: 0.24 Time: 45766.90 Local Steps: 44000\n",
      "36.980125\n",
      "Train: Step:   111 Val-Loss: 2.0061  Val-Acc: 0.25 Time: 46263.72 Local Steps: 44400\n",
      "37.776787\n",
      "Train: Step:   112 Val-Loss: 2.0677  Val-Acc: 0.16 Time: 46605.32 Local Steps: 44800\n",
      "37.38894\n",
      "Train: Step:   113 Val-Loss: 2.0357  Val-Acc: 0.21 Time: 47067.92 Local Steps: 45200\n",
      "37.46747\n",
      "Train: Step:   114 Val-Loss: 1.9924  Val-Acc: 0.25 Time: 47496.65 Local Steps: 45600\n",
      "37.77163\n",
      "Train: Step:   115 Val-Loss: 1.9795  Val-Acc: 0.28 Time: 47929.78 Local Steps: 46000\n",
      "37.58718\n",
      "Train: Step:   116 Val-Loss: 1.9953  Val-Acc: 0.25 Time: 48289.56 Local Steps: 46400\n",
      "37.450584\n",
      "Train: Step:   117 Val-Loss: 1.9807  Val-Acc: 0.24 Time: 48706.21 Local Steps: 46800\n",
      "37.104607\n",
      "Train: Step:   118 Val-Loss: 1.9930  Val-Acc: 0.26 Time: 49113.63 Local Steps: 47200\n",
      "37.308342\n",
      "Train: Step:   119 Val-Loss: 1.9750  Val-Acc: 0.24 Time: 49506.20 Local Steps: 47600\n",
      "37.75394\n",
      "Train: Step:   120 Val-Loss: 2.0047  Val-Acc: 0.24 Time: 49889.58 Local Steps: 48000\n",
      "37.769882\n",
      "Train: Step:   121 Val-Loss: 1.9935  Val-Acc: 0.24 Time: 50182.84 Local Steps: 48400\n",
      "37.67655\n",
      "Train: Step:   124 Val-Loss: 1.9973  Val-Acc: 0.24 Time: 51414.33 Local Steps: 49600\n",
      "37.457993\n",
      "Train: Step:   125 Val-Loss: 1.9968  Val-Acc: 0.25 Time: 51810.60 Local Steps: 50000\n",
      "37.6499\n",
      "Train: Step:   126 Val-Loss: 2.0398  Val-Acc: 0.21 Time: 52235.02 Local Steps: 50400\n",
      "37.63638\n",
      "Train: Step:   127 Val-Loss: 1.9995  Val-Acc: 0.25 Time: 52612.10 Local Steps: 50800\n",
      "37.69495\n",
      "Train: Step:   128 Val-Loss: 1.9958  Val-Acc: 0.25 Time: 53147.49 Local Steps: 51200\n",
      "37.72767\n",
      "Train: Step:   129 Val-Loss: 2.0037  Val-Acc: 0.22 Time: 53456.82 Local Steps: 51600\n",
      "37.423412\n",
      "Train: Step:   130 Val-Loss: 1.9684  Val-Acc: 0.27 Time: 54023.80 Local Steps: 52000\n",
      "37.811882\n",
      "Train: Step:   131 Val-Loss: 1.9949  Val-Acc: 0.23 Time: 54459.75 Local Steps: 52400\n",
      "38.027565\n",
      "Train: Step:   132 Val-Loss: 1.9352  Val-Acc: 0.26 Time: 54782.32 Local Steps: 52800\n",
      "37.70002\n",
      "Train: Step:   133 Val-Loss: 1.9118  Val-Acc: 0.28 Time: 55178.26 Local Steps: 53200\n",
      "37.548416\n",
      "Train: Step:   134 Val-Loss: 1.9443  Val-Acc: 0.25 Time: 55552.98 Local Steps: 53600\n",
      "37.73587\n",
      "Train: Step:   135 Val-Loss: 1.9236  Val-Acc: 0.28 Time: 56062.87 Local Steps: 54000\n",
      "37.384407\n",
      "Train: Step:   136 Val-Loss: 1.9614  Val-Acc: 0.24 Time: 56375.10 Local Steps: 54400\n",
      "37.07959\n",
      "Train: Step:   137 Val-Loss: 1.9525  Val-Acc: 0.27 Time: 56881.63 Local Steps: 54800\n",
      "37.1755\n",
      "Train: Step:   138 Val-Loss: 1.9780  Val-Acc: 0.27 Time: 57315.24 Local Steps: 55200\n",
      "37.864655\n",
      "Train: Step:   139 Val-Loss: 2.0297  Val-Acc: 0.24 Time: 57663.56 Local Steps: 55600\n",
      "37.77735\n",
      "Train: Step:   140 Val-Loss: 2.0202  Val-Acc: 0.25 Time: 58138.27 Local Steps: 56000\n",
      "37.823456\n",
      "Train: Step:   141 Val-Loss: 2.0442  Val-Acc: 0.23 Time: 58508.51 Local Steps: 56400\n",
      "37.202644\n",
      "Train: Step:   142 Val-Loss: 1.9933  Val-Acc: 0.27 Time: 59031.07 Local Steps: 56800\n",
      "37.447815\n",
      "Train: Step:   143 Val-Loss: 2.0321  Val-Acc: 0.25 Time: 59509.76 Local Steps: 57200\n",
      "36.778755\n",
      "Train: Step:   144 Val-Loss: 1.9924  Val-Acc: 0.26 Time: 59974.00 Local Steps: 57600\n",
      "37.1427\n",
      "Train: Step:   145 Val-Loss: 1.9677  Val-Acc: 0.26 Time: 60464.21 Local Steps: 58000\n",
      "37.604477\n",
      "Train: Step:   146 Val-Loss: 1.9807  Val-Acc: 0.23 Time: 60794.92 Local Steps: 58400\n",
      "36.644337\n",
      "Train: Step:   147 Val-Loss: 1.9505  Val-Acc: 0.28 Time: 61435.26 Local Steps: 58800\n",
      "36.8722\n",
      "Train: Step:   148 Val-Loss: 1.9552  Val-Acc: 0.25 Time: 61875.82 Local Steps: 59200\n",
      "36.54698\n",
      "Train: Step:   149 Val-Loss: 1.9381  Val-Acc: 0.27 Time: 62224.82 Local Steps: 59600\n",
      "36.731346\n",
      "Train: Step:   150 Val-Loss: 1.9419  Val-Acc: 0.27 Time: 62637.92 Local Steps: 60000\n",
      "36.309086\n",
      "Train: Step:   151 Val-Loss: 1.9716  Val-Acc: 0.25 Time: 62991.23 Local Steps: 60400\n",
      "36.44406\n",
      "Train: Step:   152 Val-Loss: 1.9807  Val-Acc: 0.24 Time: 63412.86 Local Steps: 60800\n",
      "36.874504\n",
      "Train: Step:   153 Val-Loss: 1.9477  Val-Acc: 0.26 Time: 63797.54 Local Steps: 61200\n",
      "36.97881\n",
      "Train: Step:   154 Val-Loss: 1.9457  Val-Acc: 0.28 Time: 64199.84 Local Steps: 61600\n",
      "36.448807\n",
      "Train: Step:   155 Val-Loss: 1.9282  Val-Acc: 0.28 Time: 64667.71 Local Steps: 62000\n",
      "36.699097\n",
      "Train: Step:   156 Val-Loss: 1.9635  Val-Acc: 0.26 Time: 65142.13 Local Steps: 62400\n",
      "36.403576\n",
      "Train: Step:   157 Val-Loss: 1.9596  Val-Acc: 0.27 Time: 65550.67 Local Steps: 62800\n",
      "36.196526\n",
      "Train: Step:   158 Val-Loss: 1.9263  Val-Acc: 0.26 Time: 65991.45 Local Steps: 63200\n",
      "36.497643\n",
      "Train: Step:   159 Val-Loss: 1.9356  Val-Acc: 0.26 Time: 66355.42 Local Steps: 63600\n",
      "36.513668\n",
      "Train: Step:   160 Val-Loss: 1.9071  Val-Acc: 0.30 Time: 66712.86 Local Steps: 64000\n",
      "36.113914\n",
      "Train: Step:   161 Val-Loss: 1.9273  Val-Acc: 0.29 Time: 67183.08 Local Steps: 64400\n",
      "36.8998\n",
      "Train: Step:   162 Val-Loss: 1.9710  Val-Acc: 0.22 Time: 67624.77 Local Steps: 64800\n",
      "36.553608\n",
      "Train: Step:   163 Val-Loss: 1.9366  Val-Acc: 0.27 Time: 68060.87 Local Steps: 65200\n",
      "36.35402\n",
      "Train: Step:   164 Val-Loss: 1.9403  Val-Acc: 0.25 Time: 68377.61 Local Steps: 65600\n",
      "36.02107\n",
      "Train: Step:   165 Val-Loss: 1.9616  Val-Acc: 0.27 Time: 68849.28 Local Steps: 66000\n",
      "36.321793\n",
      "Train: Step:   166 Val-Loss: 1.9712  Val-Acc: 0.26 Time: 69198.71 Local Steps: 66400\n",
      "37.35437\n",
      "Train: Step:   167 Val-Loss: 2.0304  Val-Acc: 0.23 Time: 69591.07 Local Steps: 66800\n",
      "36.494827\n",
      "Train: Step:   168 Val-Loss: 1.9435  Val-Acc: 0.26 Time: 70001.60 Local Steps: 67200\n",
      "36.215256\n",
      "Train: Step:   169 Val-Loss: 1.9416  Val-Acc: 0.25 Time: 70449.23 Local Steps: 67600\n",
      "36.477623\n",
      "Train: Step:   170 Val-Loss: 1.9214  Val-Acc: 0.26 Time: 70861.18 Local Steps: 68000\n",
      "36.24897\n",
      "Train: Step:   171 Val-Loss: 1.9056  Val-Acc: 0.27 Time: 71242.35 Local Steps: 68400\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36.39266\n",
      "Train: Step:   172 Val-Loss: 1.9443  Val-Acc: 0.28 Time: 71668.67 Local Steps: 68800\n",
      "36.12393\n",
      "Train: Step:   173 Val-Loss: 1.9262  Val-Acc: 0.27 Time: 72025.21 Local Steps: 69200\n",
      "36.09707\n",
      "Train: Step:   174 Val-Loss: 1.9169  Val-Acc: 0.27 Time: 72419.63 Local Steps: 69600\n",
      "36.13823\n",
      "Train: Step:   175 Val-Loss: 1.9476  Val-Acc: 0.26 Time: 72826.41 Local Steps: 70000\n",
      "36.17119\n",
      "Train: Step:   176 Val-Loss: 1.9173  Val-Acc: 0.28 Time: 73288.37 Local Steps: 70400\n",
      "36.503044\n",
      "Train: Step:   177 Val-Loss: 1.9516  Val-Acc: 0.27 Time: 73694.01 Local Steps: 70800\n",
      "36.10665\n",
      "Train: Step:   178 Val-Loss: 1.9216  Val-Acc: 0.28 Time: 74137.35 Local Steps: 71200\n",
      "36.79614\n",
      "Train: Step:   179 Val-Loss: 1.9375  Val-Acc: 0.26 Time: 74543.37 Local Steps: 71600\n",
      "37.12211\n",
      "Train: Step:   180 Val-Loss: 1.9376  Val-Acc: 0.29 Time: 74923.96 Local Steps: 72000\n",
      "36.40289\n",
      "Train: Step:   181 Val-Loss: 1.9450  Val-Acc: 0.27 Time: 75312.04 Local Steps: 72400\n",
      "36.158295\n",
      "Train: Step:   182 Val-Loss: 1.9045  Val-Acc: 0.28 Time: 75725.78 Local Steps: 72800\n",
      "36.01396\n",
      "Train: Step:   183 Val-Loss: 1.8908  Val-Acc: 0.30 Time: 76187.22 Local Steps: 73200\n",
      "35.64772\n",
      "Train: Step:   184 Val-Loss: 1.8844  Val-Acc: 0.29 Time: 76604.97 Local Steps: 73600\n",
      "36.27972\n",
      "Train: Step:   185 Val-Loss: 1.9468  Val-Acc: 0.26 Time: 77023.51 Local Steps: 74000\n",
      "36.354034\n",
      "Train: Step:   186 Val-Loss: 1.8920  Val-Acc: 0.28 Time: 77447.72 Local Steps: 74400\n",
      "36.444656\n",
      "Train: Step:   187 Val-Loss: 1.8649  Val-Acc: 0.28 Time: 77828.60 Local Steps: 74800\n",
      "36.095795\n",
      "Train: Step:   188 Val-Loss: 1.8683  Val-Acc: 0.29 Time: 78217.09 Local Steps: 75200\n",
      "36.03718\n",
      "Train: Step:   189 Val-Loss: 1.8851  Val-Acc: 0.29 Time: 78650.75 Local Steps: 75600\n",
      "35.856926\n",
      "Train: Step:   190 Val-Loss: 1.8809  Val-Acc: 0.29 Time: 79137.13 Local Steps: 76000\n",
      "36.974346\n",
      "Train: Step:   191 Val-Loss: 2.0319  Val-Acc: 0.21 Time: 79637.98 Local Steps: 76400\n",
      "35.944756\n",
      "Train: Step:   192 Val-Loss: 1.9438  Val-Acc: 0.25 Time: 80042.75 Local Steps: 76800\n",
      "36.03508\n",
      "Train: Step:   193 Val-Loss: 1.9007  Val-Acc: 0.29 Time: 80491.65 Local Steps: 77200\n",
      "36.16488\n",
      "Train: Step:   194 Val-Loss: 1.8828  Val-Acc: 0.30 Time: 80886.01 Local Steps: 77600\n",
      "35.83332\n",
      "Train: Step:   195 Val-Loss: 1.9069  Val-Acc: 0.27 Time: 81390.64 Local Steps: 78000\n",
      "35.663532\n",
      "Train: Step:   196 Val-Loss: 1.9169  Val-Acc: 0.29 Time: 81846.16 Local Steps: 78400\n",
      "35.914085\n",
      "Train: Step:   197 Val-Loss: 1.9083  Val-Acc: 0.28 Time: 82313.92 Local Steps: 78800\n",
      "35.769733\n",
      "Train: Step:   198 Val-Loss: 1.9010  Val-Acc: 0.29 Time: 82592.16 Local Steps: 79200\n",
      "36.11457\n",
      "Train: Step:   199 Val-Loss: 1.9458  Val-Acc: 0.24 Time: 83017.92 Local Steps: 79600\n",
      "36.50506\n",
      "Train: Step:   200 Val-Loss: 1.9759  Val-Acc: 0.26 Time: 83418.10 Local Steps: 80000\n",
      "35.736065\n",
      "Train: Step:   201 Val-Loss: 1.9090  Val-Acc: 0.29 Time: 83846.84 Local Steps: 80400\n",
      "36.042534\n",
      "Train: Step:   202 Val-Loss: 1.9570  Val-Acc: 0.29 Time: 84292.46 Local Steps: 80800\n",
      "35.846443\n",
      "Train: Step:   203 Val-Loss: 1.9632  Val-Acc: 0.26 Time: 84739.49 Local Steps: 81200\n",
      "35.88919\n",
      "Train: Step:   204 Val-Loss: 1.9391  Val-Acc: 0.28 Time: 85137.33 Local Steps: 81600\n",
      "35.657936\n",
      "Train: Step:   205 Val-Loss: 1.9102  Val-Acc: 0.26 Time: 85593.07 Local Steps: 82000\n",
      "35.578\n",
      "Train: Step:   206 Val-Loss: 1.9037  Val-Acc: 0.29 Time: 85935.71 Local Steps: 82400\n",
      "35.69275\n",
      "Train: Step:   207 Val-Loss: 1.9545  Val-Acc: 0.27 Time: 86283.83 Local Steps: 82800\n",
      "35.646103\n",
      "Train: Step:   208 Val-Loss: 1.9218  Val-Acc: 0.28 Time: 86638.45 Local Steps: 83200\n",
      "36.50989\n",
      "Train: Step:   209 Val-Loss: 2.0421  Val-Acc: 0.20 Time: 87059.70 Local Steps: 83600\n",
      "35.883675\n",
      "Train: Step:   210 Val-Loss: 1.9634  Val-Acc: 0.26 Time: 87416.94 Local Steps: 84000\n",
      "35.54647\n",
      "Train: Step:   211 Val-Loss: 1.8798  Val-Acc: 0.30 Time: 87854.63 Local Steps: 84400\n",
      "35.539043\n",
      "Train: Step:   212 Val-Loss: 1.9049  Val-Acc: 0.29 Time: 88314.48 Local Steps: 84800\n",
      "35.649208\n",
      "Train: Step:   213 Val-Loss: 1.9243  Val-Acc: 0.27 Time: 88726.04 Local Steps: 85200\n",
      "35.706482\n",
      "Train: Step:   214 Val-Loss: 1.9229  Val-Acc: 0.26 Time: 89073.66 Local Steps: 85600\n",
      "35.51152\n",
      "Train: Step:   215 Val-Loss: 1.8791  Val-Acc: 0.29 Time: 89479.15 Local Steps: 86000\n",
      "36.14713\n",
      "Train: Step:   216 Val-Loss: 1.9524  Val-Acc: 0.23 Time: 89938.42 Local Steps: 86400\n",
      "35.471336\n",
      "Train: Step:   217 Val-Loss: 1.9094  Val-Acc: 0.26 Time: 90258.98 Local Steps: 86800\n",
      "35.958454\n",
      "Train: Step:   218 Val-Loss: 1.9900  Val-Acc: 0.22 Time: 90761.76 Local Steps: 87200\n",
      "35.10695\n",
      "Train: Step:   219 Val-Loss: 1.9192  Val-Acc: 0.27 Time: 91154.37 Local Steps: 87600\n",
      "34.942223\n",
      "Train: Step:   220 Val-Loss: 1.8929  Val-Acc: 0.30 Time: 91557.84 Local Steps: 88000\n",
      "35.259888\n",
      "Train: Step:   221 Val-Loss: 1.9118  Val-Acc: 0.27 Time: 91969.91 Local Steps: 88400\n",
      "35.24243\n",
      "Train: Step:   222 Val-Loss: 1.9738  Val-Acc: 0.23 Time: 92425.23 Local Steps: 88800\n",
      "35.190964\n",
      "Train: Step:   223 Val-Loss: 1.9739  Val-Acc: 0.27 Time: 92817.83 Local Steps: 89200\n",
      "35.4756\n",
      "Train: Step:   224 Val-Loss: 1.9707  Val-Acc: 0.26 Time: 93196.46 Local Steps: 89600\n",
      "35.547485\n",
      "Train: Step:   225 Val-Loss: 1.9722  Val-Acc: 0.27 Time: 93506.37 Local Steps: 90000\n",
      "35.46383\n",
      "Train: Step:   226 Val-Loss: 1.9860  Val-Acc: 0.26 Time: 93985.72 Local Steps: 90400\n",
      "35.658966\n",
      "Train: Step:   227 Val-Loss: 1.9292  Val-Acc: 0.26 Time: 94345.56 Local Steps: 90800\n",
      "35.3503\n",
      "Train: Step:   228 Val-Loss: 1.9484  Val-Acc: 0.27 Time: 94713.01 Local Steps: 91200\n",
      "35.030247\n",
      "Train: Step:   229 Val-Loss: 1.8760  Val-Acc: 0.30 Time: 95148.17 Local Steps: 91600\n",
      "34.935898\n",
      "Train: Step:   230 Val-Loss: 1.9020  Val-Acc: 0.31 Time: 95632.19 Local Steps: 92000\n",
      "35.104366\n",
      "Train: Step:   231 Val-Loss: 1.9110  Val-Acc: 0.28 Time: 96027.69 Local Steps: 92400\n",
      "35.3377\n",
      "Train: Step:   232 Val-Loss: 1.9046  Val-Acc: 0.31 Time: 96430.57 Local Steps: 92800\n",
      "35.219383\n",
      "Train: Step:   233 Val-Loss: 1.8773  Val-Acc: 0.30 Time: 96864.49 Local Steps: 93200\n",
      "35.14614\n",
      "Train: Step:   234 Val-Loss: 1.9020  Val-Acc: 0.27 Time: 97260.75 Local Steps: 93600\n",
      "34.881294\n",
      "Train: Step:   235 Val-Loss: 1.9234  Val-Acc: 0.31 Time: 97631.93 Local Steps: 94000\n",
      "35.421715\n",
      "Train: Step:   236 Val-Loss: 1.9562  Val-Acc: 0.30 Time: 98124.39 Local Steps: 94400\n",
      "35.16903\n",
      "Train: Step:   237 Val-Loss: 1.9631  Val-Acc: 0.27 Time: 98445.26 Local Steps: 94800\n",
      "35.22771\n",
      "Train: Step:   238 Val-Loss: 1.9910  Val-Acc: 0.26 Time: 98829.42 Local Steps: 95200\n",
      "34.894676\n",
      "Train: Step:   239 Val-Loss: 1.9533  Val-Acc: 0.29 Time: 99180.83 Local Steps: 95600\n",
      "34.747643\n",
      "Train: Step:   240 Val-Loss: 1.9316  Val-Acc: 0.30 Time: 99587.70 Local Steps: 96000\n",
      "35.19289\n",
      "Train: Step:   241 Val-Loss: 1.9806  Val-Acc: 0.26 Time: 99972.10 Local Steps: 96400\n",
      "34.751396\n",
      "Train: Step:   242 Val-Loss: 1.9330  Val-Acc: 0.28 Time: 100402.23 Local Steps: 96800\n",
      "Finished in 8931.34196472168\n",
      "--- FedBuff ---\n",
      "ResNetCifar(\n",
      "  (conv1): Conv2d_LUQ(3, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "  (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "  (relu): ReLU(inplace=True)\n",
      "  (layer1): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(16, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (layer2): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(16, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "      (downsample): Sequential(\n",
      "        (0): Conv2d_LUQ(16, 32, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "        (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      )\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (layer3): Sequential(\n",
      "    (0): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(32, 64, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "      (downsample): Sequential(\n",
      "        (0): Conv2d_LUQ(32, 64, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "        (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      )\n",
      "    )\n",
      "    (1): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "    (2): BasicBlock(\n",
      "      (conv1): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu1): ReLU()\n",
      "      (conv2): Conv2d_LUQ(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu2): ReLU()\n",
      "    )\n",
      "  )\n",
      "  (avgpool): AvgPool2d(kernel_size=8, stride=1, padding=0)\n",
      "  (fc): Linear(in_features=64, out_features=10, bias=True)\n",
      ")\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Client 1 is added to the population.\n",
      "Client 2 is added to the population.\n",
      "Client 3 is added to the population.\n",
      "Client 4 is added to the population.\n",
      "Client 5 is added to the population.\n",
      "Client 6 is added to the population.\n",
      "Client 7 is added to the population.\n",
      "Client 8 is added to the population.\n",
      "Client 9 is added to the population.\n",
      "Client 10 is added to the population.\n",
      "Client 11 is added to the population.\n",
      "Client 12 is added to the population.\n",
      "Client 13 is added to the population.\n",
      "Client 14 is added to the population.\n",
      "Client 15 is added to the population.\n",
      "Client 16 is added to the population.\n",
      "Client 17 is added to the population.\n",
      "Client 18 is added to the population.\n",
      "Client 19 is added to the population.\n",
      "Client 20 is added to the population.\n",
      "Client 21 is added to the population.\n",
      "Client 22 is added to the population.\n",
      "Client 23 is added to the population.\n",
      "Client 24 is added to the population.\n",
      "Client 25 is added to the population.\n",
      "Client 26 is added to the population.\n",
      "Client 27 is added to the population.\n",
      "Client 28 is added to the population.\n",
      "Client 29 is added to the population.\n",
      "Client 30 is added to the population.\n",
      "Client 31 is added to the population.\n",
      "Client 32 is added to the population.\n",
      "Client 33 is added to the population.\n",
      "Client 34 is added to the population.\n",
      "Client 35 is added to the population.\n",
      "Client 36 is added to the population.\n",
      "Client 37 is added to the population.\n",
      "Client 38 is added to the population.\n",
      "Client 39 is added to the population.\n",
      "Client 40 is added to the population.\n",
      "Client 41 is added to the population.\n",
      "Client 42 is added to the population.\n",
      "Client 43 is added to the population.\n",
      "Client 44 is added to the population.\n",
      "Client 45 is added to the population.\n",
      "Client 46 is added to the population.\n",
      "Client 47 is added to the population.\n",
      "Client 48 is added to the population.\n",
      "Client 49 is added to the population.\n",
      "Client 50 is added to the population.\n",
      "Client 51 is added to the population.\n",
      "Client 52 is added to the population.\n",
      "Client 53 is added to the population.\n",
      "Client 54 is added to the population.\n",
      "Client 55 is added to the population.\n",
      "Client 56 is added to the population.\n",
      "Client 57 is added to the population.\n",
      "Client 58 is added to the population.\n",
      "Client 59 is added to the population.\n",
      "Client 60 is added to the population.\n",
      "Client 61 is added to the population.\n",
      "Client 62 is added to the population.\n",
      "Client 63 is added to the population.\n",
      "Client 64 is added to the population.\n",
      "Client 65 is added to the population.\n",
      "Client 66 is added to the population.\n",
      "Client 67 is added to the population.\n",
      "Client 68 is added to the population.\n",
      "Client 69 is added to the population.\n",
      "Client 70 is added to the population.\n",
      "Client 71 is added to the population.\n",
      "Client 72 is added to the population.\n",
      "Client 73 is added to the population.\n",
      "Client 74 is added to the population.\n",
      "Client 75 is added to the population.\n",
      "Client 76 is added to the population.\n",
      "Client 77 is added to the population.\n",
      "Client 78 is added to the population.\n",
      "Client 79 is added to the population.\n",
      "Client 80 is added to the population.\n",
      "Client 81 is added to the population.\n",
      "Client 82 is added to the population.\n",
      "Client 83 is added to the population.\n",
      "Client 84 is added to the population.\n",
      "Client 85 is added to the population.\n",
      "Client 86 is added to the population.\n",
      "Client 87 is added to the population.\n",
      "Client 88 is added to the population.\n",
      "Client 89 is added to the population.\n",
      "Client 90 is added to the population.\n",
      "Client 91 is added to the population.\n",
      "Client 92 is added to the population.\n",
      "Client 93 is added to the population.\n",
      "Client 94 is added to the population.\n",
      "Client 95 is added to the population.\n",
      "Client 96 is added to the population.\n",
      "Client 97 is added to the population.\n",
      "Client 98 is added to the population.\n",
      "Client 99 is added to the population.\n",
      "Client 100 is added to the population.\n",
      "0.0\n",
      "Train: Step:     0 Val-Loss: 2.8170  Val-Acc: 0.10 Time:   0.00 Local Steps:     0\n",
      "39.083767\n",
      "Train: Step:   193 Val-Loss: 2.2263  Val-Acc: 0.17 Time: 1149.67 Local Steps: 40400\n",
      "38.884785\n",
      "Train: Step:   202 Val-Loss: 2.2454  Val-Acc: 0.17 Time: 1204.56 Local Steps: 42200\n",
      "40.808773\n",
      "Train: Step:   211 Val-Loss: 2.2640  Val-Acc: 0.17 Time: 1257.44 Local Steps: 44000\n",
      "40.182518\n",
      "Train: Step:   220 Val-Loss: 2.2170  Val-Acc: 0.14 Time: 1309.78 Local Steps: 45800\n",
      "38.655037\n",
      "Train: Step:   230 Val-Loss: 2.1959  Val-Acc: 0.19 Time: 1362.62 Local Steps: 47800\n",
      "39.138535\n",
      "Train: Step:   238 Val-Loss: 2.2119  Val-Acc: 0.16 Time: 1414.17 Local Steps: 49400\n",
      "41.37407\n",
      "Train: Step:   247 Val-Loss: 2.2890  Val-Acc: 0.14 Time: 1468.39 Local Steps: 51200\n",
      "39.13516\n",
      "Train: Step:   257 Val-Loss: 2.1839  Val-Acc: 0.20 Time: 1523.89 Local Steps: 53200\n",
      "39.767914\n",
      "Train: Step:   267 Val-Loss: 2.2203  Val-Acc: 0.17 Time: 1582.04 Local Steps: 55200\n",
      "39.33718\n",
      "Train: Step:   276 Val-Loss: 2.2027  Val-Acc: 0.19 Time: 1634.52 Local Steps: 57000\n",
      "39.02127\n",
      "Train: Step:   285 Val-Loss: 2.1259  Val-Acc: 0.22 Time: 1685.10 Local Steps: 58800\n",
      "39.991364\n",
      "Train: Step:   294 Val-Loss: 2.1615  Val-Acc: 0.21 Time: 1741.92 Local Steps: 60600\n",
      "39.46897\n",
      "Train: Step:   303 Val-Loss: 2.1282  Val-Acc: 0.23 Time: 1793.88 Local Steps: 62400\n",
      "40.075233\n",
      "Train: Step:   313 Val-Loss: 2.1738  Val-Acc: 0.16 Time: 1849.38 Local Steps: 64400\n",
      "39.14135\n",
      "Train: Step:   349 Val-Loss: 2.1572  Val-Acc: 0.21 Time: 2060.08 Local Steps: 71600\n",
      "39.06996\n",
      "Train: Step:   359 Val-Loss: 2.0981  Val-Acc: 0.22 Time: 2115.25 Local Steps: 73600\n",
      "41.850952\n",
      "Train: Step:   368 Val-Loss: 2.2034  Val-Acc: 0.11 Time: 2167.04 Local Steps: 75400\n",
      "40.53887\n",
      "Train: Step:   377 Val-Loss: 2.0916  Val-Acc: 0.21 Time: 2219.55 Local Steps: 77200\n",
      "39.95297\n",
      "Train: Step:   386 Val-Loss: 2.1555  Val-Acc: 0.20 Time: 2269.70 Local Steps: 79000\n",
      "38.53167\n",
      "Train: Step:   395 Val-Loss: 2.0891  Val-Acc: 0.22 Time: 2320.75 Local Steps: 80800\n",
      "39.869957\n",
      "Train: Step:   404 Val-Loss: 2.1113  Val-Acc: 0.20 Time: 2372.83 Local Steps: 82600\n",
      "39.76307\n",
      "Train: Step:   414 Val-Loss: 2.1111  Val-Acc: 0.23 Time: 2428.20 Local Steps: 84600\n",
      "40.028442\n",
      "Train: Step:   423 Val-Loss: 2.1612  Val-Acc: 0.15 Time: 2482.44 Local Steps: 86400\n",
      "40.64431\n",
      "Train: Step:   432 Val-Loss: 2.1021  Val-Acc: 0.20 Time: 2535.39 Local Steps: 88200\n",
      "41.33201\n",
      "Train: Step:   442 Val-Loss: 2.1404  Val-Acc: 0.21 Time: 2592.75 Local Steps: 90200\n",
      "39.564186\n",
      "Train: Step:   450 Val-Loss: 2.1260  Val-Acc: 0.19 Time: 2642.98 Local Steps: 91800\n",
      "39.589123\n",
      "Train: Step:   460 Val-Loss: 2.0704  Val-Acc: 0.22 Time: 2702.14 Local Steps: 93800\n",
      "38.793\n",
      "Train: Step:   470 Val-Loss: 2.0726  Val-Acc: 0.20 Time: 2756.00 Local Steps: 95800\n",
      "39.48873\n",
      "Train: Step:   479 Val-Loss: 2.1266  Val-Acc: 0.19 Time: 2807.41 Local Steps: 97600\n",
      "39.982258\n",
      "Train: Step:   487 Val-Loss: 2.0991  Val-Acc: 0.20 Time: 2857.60 Local Steps: 99200\n",
      "39.644688\n",
      "Train: Step:   496 Val-Loss: 2.0789  Val-Acc: 0.23 Time: 2910.48 Local Steps: 101000\n",
      "39.003426\n",
      "Train: Step:   505 Val-Loss: 2.0192  Val-Acc: 0.24 Time: 2961.46 Local Steps: 102800\n",
      "39.20479\n",
      "Train: Step:   514 Val-Loss: 2.1041  Val-Acc: 0.23 Time: 3015.47 Local Steps: 104600\n",
      "39.781517\n",
      "Train: Step:   523 Val-Loss: 2.1307  Val-Acc: 0.20 Time: 3070.73 Local Steps: 106400\n",
      "39.839787\n",
      "Train: Step:   532 Val-Loss: 2.0300  Val-Acc: 0.22 Time: 3121.51 Local Steps: 108200\n",
      "40.17656\n",
      "Train: Step:   541 Val-Loss: 2.0163  Val-Acc: 0.23 Time: 3173.99 Local Steps: 110000\n",
      "40.713203\n",
      "Train: Step:   551 Val-Loss: 2.1755  Val-Acc: 0.18 Time: 3227.49 Local Steps: 112000\n",
      "39.52884\n",
      "Train: Step:   560 Val-Loss: 2.0682  Val-Acc: 0.22 Time: 3283.89 Local Steps: 113800\n",
      "40.018436\n",
      "Train: Step:   569 Val-Loss: 2.0879  Val-Acc: 0.20 Time: 3339.88 Local Steps: 115600\n",
      "40.607914\n",
      "Train: Step:   578 Val-Loss: 2.0688  Val-Acc: 0.20 Time: 3390.78 Local Steps: 117400\n",
      "40.61828\n",
      "Train: Step:   587 Val-Loss: 2.0217  Val-Acc: 0.23 Time: 3442.47 Local Steps: 119200\n",
      "39.772648\n",
      "Train: Step:   596 Val-Loss: 2.0351  Val-Acc: 0.22 Time: 3494.16 Local Steps: 121000\n",
      "39.7343\n",
      "Train: Step:   605 Val-Loss: 2.0723  Val-Acc: 0.22 Time: 3545.23 Local Steps: 122800\n",
      "39.19566\n",
      "Train: Step:   613 Val-Loss: 2.0113  Val-Acc: 0.24 Time: 3595.89 Local Steps: 124400\n",
      "40.5016\n",
      "Train: Step:   621 Val-Loss: 2.0951  Val-Acc: 0.18 Time: 3645.98 Local Steps: 126000\n",
      "38.572342\n",
      "Train: Step:   631 Val-Loss: 2.0098  Val-Acc: 0.24 Time: 3697.59 Local Steps: 128000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "39.464546\n",
      "Train: Step:   639 Val-Loss: 2.0470  Val-Acc: 0.24 Time: 3748.57 Local Steps: 129600\n",
      "38.617306\n",
      "Train: Step:   648 Val-Loss: 2.0523  Val-Acc: 0.21 Time: 3800.70 Local Steps: 131400\n",
      "38.73533\n",
      "Train: Step:   657 Val-Loss: 2.0455  Val-Acc: 0.21 Time: 3851.90 Local Steps: 133200\n",
      "39.588623\n",
      "Train: Step:   666 Val-Loss: 2.0188  Val-Acc: 0.23 Time: 3905.69 Local Steps: 135000\n",
      "39.60977\n",
      "Train: Step:   675 Val-Loss: 2.0886  Val-Acc: 0.21 Time: 3957.70 Local Steps: 136800\n",
      "39.177288\n",
      "Train: Step:   685 Val-Loss: 2.0076  Val-Acc: 0.23 Time: 4013.06 Local Steps: 138800\n",
      "39.809372\n",
      "Train: Step:   694 Val-Loss: 2.0890  Val-Acc: 0.19 Time: 4068.55 Local Steps: 140600\n",
      "39.280922\n",
      "Train: Step:   703 Val-Loss: 1.9983  Val-Acc: 0.21 Time: 4122.10 Local Steps: 142400\n",
      "40.028786\n",
      "Train: Step:   712 Val-Loss: 2.1009  Val-Acc: 0.20 Time: 4176.21 Local Steps: 144200\n",
      "38.444855\n",
      "Train: Step:   722 Val-Loss: 2.0144  Val-Acc: 0.24 Time: 4232.66 Local Steps: 146200\n",
      "39.87498\n",
      "Train: Step:   732 Val-Loss: 2.0011  Val-Acc: 0.25 Time: 4285.56 Local Steps: 148200\n",
      "38.903816\n",
      "Train: Step:   741 Val-Loss: 2.0173  Val-Acc: 0.23 Time: 4339.62 Local Steps: 150000\n",
      "38.46601\n",
      "Train: Step:   750 Val-Loss: 2.0308  Val-Acc: 0.23 Time: 4395.12 Local Steps: 151800\n",
      "40.355804\n",
      "Train: Step:   759 Val-Loss: 2.0653  Val-Acc: 0.19 Time: 4449.63 Local Steps: 153600\n",
      "39.67882\n",
      "Train: Step:   768 Val-Loss: 2.0297  Val-Acc: 0.22 Time: 4502.98 Local Steps: 155400\n",
      "39.217926\n",
      "Train: Step:   777 Val-Loss: 2.0794  Val-Acc: 0.21 Time: 4553.14 Local Steps: 157200\n",
      "38.260445\n",
      "Train: Step:   786 Val-Loss: 1.9886  Val-Acc: 0.26 Time: 4606.95 Local Steps: 159000\n",
      "39.069954\n",
      "Train: Step:   795 Val-Loss: 2.0067  Val-Acc: 0.24 Time: 4658.53 Local Steps: 160800\n",
      "39.451103\n",
      "Train: Step:   804 Val-Loss: 1.9912  Val-Acc: 0.22 Time: 4710.50 Local Steps: 162600\n",
      "38.453506\n",
      "Train: Step:   813 Val-Loss: 1.9788  Val-Acc: 0.24 Time: 4763.00 Local Steps: 164400\n",
      "39.387222\n",
      "Train: Step:   822 Val-Loss: 2.1055  Val-Acc: 0.22 Time: 4813.77 Local Steps: 166200\n",
      "39.427734\n",
      "Train: Step:   831 Val-Loss: 1.9793  Val-Acc: 0.23 Time: 4866.53 Local Steps: 168000\n",
      "39.159462\n",
      "Train: Step:   840 Val-Loss: 2.0639  Val-Acc: 0.23 Time: 4918.76 Local Steps: 169800\n",
      "40.477295\n",
      "Train: Step:   850 Val-Loss: 2.0950  Val-Acc: 0.21 Time: 4977.75 Local Steps: 171800\n",
      "38.595127\n",
      "Train: Step:   859 Val-Loss: 1.9931  Val-Acc: 0.23 Time: 5030.15 Local Steps: 173600\n",
      "39.38768\n",
      "Train: Step:   868 Val-Loss: 2.0379  Val-Acc: 0.21 Time: 5082.80 Local Steps: 175400\n",
      "39.621147\n",
      "Train: Step:   877 Val-Loss: 2.1073  Val-Acc: 0.19 Time: 5133.36 Local Steps: 177200\n",
      "39.560455\n",
      "Train: Step:   886 Val-Loss: 2.0028  Val-Acc: 0.26 Time: 5187.74 Local Steps: 179000\n",
      "39.4135\n",
      "Train: Step:   895 Val-Loss: 2.0301  Val-Acc: 0.20 Time: 5242.92 Local Steps: 180800\n",
      "38.648582\n",
      "Train: Step:   903 Val-Loss: 1.9723  Val-Acc: 0.24 Time: 5294.11 Local Steps: 182400\n",
      "38.814964\n",
      "Train: Step:   913 Val-Loss: 2.0145  Val-Acc: 0.26 Time: 5351.32 Local Steps: 184400\n",
      "38.800835\n",
      "Train: Step:   922 Val-Loss: 2.0057  Val-Acc: 0.23 Time: 5402.94 Local Steps: 186200\n",
      "38.149723\n",
      "Train: Step:   931 Val-Loss: 1.9498  Val-Acc: 0.26 Time: 5457.15 Local Steps: 188000\n",
      "38.37191\n",
      "Train: Step:   941 Val-Loss: 2.0086  Val-Acc: 0.24 Time: 5511.39 Local Steps: 190000\n",
      "38.915794\n",
      "Train: Step:   950 Val-Loss: 1.9953  Val-Acc: 0.25 Time: 5565.54 Local Steps: 191800\n",
      "38.48045\n",
      "Train: Step:   959 Val-Loss: 1.9638  Val-Acc: 0.25 Time: 5617.66 Local Steps: 193600\n",
      "39.10276\n",
      "Train: Step:   968 Val-Loss: 2.0495  Val-Acc: 0.23 Time: 5671.33 Local Steps: 195400\n",
      "38.86866\n",
      "Train: Step:   978 Val-Loss: 2.0203  Val-Acc: 0.21 Time: 5725.24 Local Steps: 197400\n",
      "39.13246\n",
      "Train: Step:   987 Val-Loss: 1.9923  Val-Acc: 0.24 Time: 5778.04 Local Steps: 199200\n",
      "39.939667\n",
      "Train: Step:   996 Val-Loss: 1.9628  Val-Acc: 0.27 Time: 5830.15 Local Steps: 201000\n",
      "39.446323\n",
      "Train: Step:  1005 Val-Loss: 2.0949  Val-Acc: 0.20 Time: 5880.56 Local Steps: 202800\n",
      "39.10642\n",
      "Train: Step:  1014 Val-Loss: 1.9814  Val-Acc: 0.26 Time: 5935.40 Local Steps: 204600\n",
      "40.485107\n",
      "Train: Step:  1023 Val-Loss: 2.0159  Val-Acc: 0.21 Time: 5987.86 Local Steps: 206400\n",
      "40.89125\n",
      "Train: Step:  1032 Val-Loss: 2.0284  Val-Acc: 0.22 Time: 6045.40 Local Steps: 208200\n",
      "39.507164\n",
      "Train: Step:  1042 Val-Loss: 1.9665  Val-Acc: 0.28 Time: 6099.04 Local Steps: 210200\n",
      "38.260704\n",
      "Train: Step:  1052 Val-Loss: 1.9798  Val-Acc: 0.24 Time: 6154.54 Local Steps: 212200\n",
      "39.42672\n",
      "Train: Step:  1061 Val-Loss: 2.0272  Val-Acc: 0.23 Time: 6209.15 Local Steps: 214000\n",
      "38.608833\n",
      "Train: Step:  1070 Val-Loss: 1.9664  Val-Acc: 0.25 Time: 6260.93 Local Steps: 215800\n",
      "38.517494\n",
      "Train: Step:  1079 Val-Loss: 1.9631  Val-Acc: 0.24 Time: 6317.55 Local Steps: 217600\n",
      "37.624653\n",
      "Train: Step:  1088 Val-Loss: 1.9377  Val-Acc: 0.26 Time: 6367.95 Local Steps: 219400\n",
      "38.214752\n",
      "Train: Step:  1097 Val-Loss: 1.9443  Val-Acc: 0.26 Time: 6420.72 Local Steps: 221200\n",
      "39.457413\n",
      "Train: Step:  1107 Val-Loss: 1.9678  Val-Acc: 0.27 Time: 6477.19 Local Steps: 223200\n",
      "38.67372\n",
      "Train: Step:  1116 Val-Loss: 1.9971  Val-Acc: 0.25 Time: 6527.94 Local Steps: 225000\n",
      "37.859676\n",
      "Train: Step:  1124 Val-Loss: 1.9782  Val-Acc: 0.24 Time: 6579.03 Local Steps: 226600\n",
      "38.489105\n",
      "Train: Step:  1132 Val-Loss: 1.9668  Val-Acc: 0.22 Time: 6629.96 Local Steps: 228200\n",
      "39.065117\n",
      "Train: Step:  1141 Val-Loss: 2.0205  Val-Acc: 0.21 Time: 6681.85 Local Steps: 230000\n",
      "38.36035\n",
      "Train: Step:  1150 Val-Loss: 1.9802  Val-Acc: 0.26 Time: 6733.78 Local Steps: 231800\n",
      "37.827087\n",
      "Train: Step:  1159 Val-Loss: 1.9461  Val-Acc: 0.27 Time: 6786.46 Local Steps: 233600\n",
      "38.70591\n",
      "Train: Step:  1168 Val-Loss: 1.9452  Val-Acc: 0.23 Time: 6836.48 Local Steps: 235400\n",
      "38.22151\n",
      "Train: Step:  1177 Val-Loss: 1.9982  Val-Acc: 0.24 Time: 6887.57 Local Steps: 237200\n",
      "39.002563\n",
      "Train: Step:  1186 Val-Loss: 2.0133  Val-Acc: 0.20 Time: 6938.78 Local Steps: 239000\n",
      "38.28636\n",
      "Train: Step:  1195 Val-Loss: 1.9645  Val-Acc: 0.24 Time: 6990.03 Local Steps: 240800\n",
      "37.706196\n",
      "Train: Step:  1204 Val-Loss: 1.9700  Val-Acc: 0.25 Time: 7045.34 Local Steps: 242600\n",
      "38.498066\n",
      "Train: Step:  1213 Val-Loss: 1.9187  Val-Acc: 0.29 Time: 7095.98 Local Steps: 244400\n",
      "39.9143\n",
      "Train: Step:  1222 Val-Loss: 1.9984  Val-Acc: 0.22 Time: 7147.03 Local Steps: 246200\n",
      "38.811905\n",
      "Train: Step:  1230 Val-Loss: 2.0015  Val-Acc: 0.23 Time: 7197.77 Local Steps: 247800\n",
      "38.241295\n",
      "Train: Step:  1239 Val-Loss: 1.9473  Val-Acc: 0.26 Time: 7252.06 Local Steps: 249600\n",
      "38.35887\n",
      "Train: Step:  1248 Val-Loss: 1.9353  Val-Acc: 0.28 Time: 7303.89 Local Steps: 251400\n",
      "37.84926\n",
      "Train: Step:  1257 Val-Loss: 1.9261  Val-Acc: 0.27 Time: 7357.16 Local Steps: 253200\n",
      "40.041466\n",
      "Train: Step:  1266 Val-Loss: 2.0235  Val-Acc: 0.25 Time: 7414.10 Local Steps: 255000\n",
      "39.168938\n",
      "Train: Step:  1276 Val-Loss: 2.0577  Val-Acc: 0.22 Time: 7470.40 Local Steps: 257000\n",
      "37.606873\n",
      "Train: Step:  1285 Val-Loss: 1.9080  Val-Acc: 0.26 Time: 7523.83 Local Steps: 258800\n",
      "38.77687\n",
      "Train: Step:  1293 Val-Loss: 1.9731  Val-Acc: 0.24 Time: 7574.32 Local Steps: 260400\n",
      "37.989555\n",
      "Train: Step:  1302 Val-Loss: 1.9508  Val-Acc: 0.25 Time: 7626.23 Local Steps: 262200\n",
      "38.206276\n",
      "Train: Step:  1311 Val-Loss: 1.9482  Val-Acc: 0.28 Time: 7679.46 Local Steps: 264000\n",
      "38.13543\n",
      "Train: Step:  1321 Val-Loss: 1.9593  Val-Acc: 0.25 Time: 7737.03 Local Steps: 266000\n",
      "38.831512\n",
      "Train: Step:  1330 Val-Loss: 1.9822  Val-Acc: 0.27 Time: 7790.67 Local Steps: 267800\n",
      "38.135334\n",
      "Train: Step:  1339 Val-Loss: 1.9095  Val-Acc: 0.25 Time: 7842.40 Local Steps: 269600\n",
      "38.970528\n",
      "Train: Step:  1348 Val-Loss: 1.9577  Val-Acc: 0.24 Time: 7893.79 Local Steps: 271400\n",
      "37.80757\n",
      "Train: Step:  1357 Val-Loss: 1.9676  Val-Acc: 0.24 Time: 7946.95 Local Steps: 273200\n",
      "37.768726\n",
      "Train: Step:  1366 Val-Loss: 1.9140  Val-Acc: 0.28 Time: 8003.23 Local Steps: 275000\n",
      "37.912464\n",
      "Train: Step:  1375 Val-Loss: 1.9866  Val-Acc: 0.23 Time: 8054.85 Local Steps: 276800\n",
      "38.261036\n",
      "Train: Step:  1384 Val-Loss: 1.9374  Val-Acc: 0.26 Time: 8104.94 Local Steps: 278600\n",
      "38.668556\n",
      "Train: Step:  1393 Val-Loss: 1.9738  Val-Acc: 0.25 Time: 8158.82 Local Steps: 280400\n",
      "39.14815\n",
      "Train: Step:  1402 Val-Loss: 1.9535  Val-Acc: 0.25 Time: 8212.20 Local Steps: 282200\n",
      "37.451935\n",
      "Train: Step:  1412 Val-Loss: 1.9449  Val-Acc: 0.28 Time: 8270.19 Local Steps: 284200\n",
      "37.298275\n",
      "Train: Step:  1422 Val-Loss: 1.9213  Val-Acc: 0.28 Time: 8326.17 Local Steps: 286200\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "38.68475\n",
      "Train: Step:  1431 Val-Loss: 1.9929  Val-Acc: 0.22 Time: 8379.52 Local Steps: 288000\n",
      "39.41919\n",
      "Train: Step:  1440 Val-Loss: 1.9558  Val-Acc: 0.27 Time: 8433.42 Local Steps: 289800\n",
      "37.47828\n",
      "Train: Step:  1450 Val-Loss: 1.9310  Val-Acc: 0.25 Time: 8489.33 Local Steps: 291800\n",
      "38.483162\n",
      "Train: Step:  1460 Val-Loss: 1.9618  Val-Acc: 0.26 Time: 8546.28 Local Steps: 293800\n",
      "38.38379\n",
      "Train: Step:  1469 Val-Loss: 1.9465  Val-Acc: 0.27 Time: 8599.70 Local Steps: 295600\n",
      "37.68551\n",
      "Train: Step:  1478 Val-Loss: 1.9670  Val-Acc: 0.24 Time: 8650.33 Local Steps: 297400\n",
      "38.46084\n",
      "Train: Step:  1488 Val-Loss: 1.9091  Val-Acc: 0.27 Time: 8704.44 Local Steps: 299400\n",
      "38.2721\n",
      "Train: Step:  1497 Val-Loss: 1.9594  Val-Acc: 0.28 Time: 8758.57 Local Steps: 301200\n",
      "39.272217\n",
      "Train: Step:  1506 Val-Loss: 2.1796  Val-Acc: 0.20 Time: 8811.34 Local Steps: 303000\n",
      "38.32669\n",
      "Train: Step:  1516 Val-Loss: 1.9127  Val-Acc: 0.29 Time: 8869.71 Local Steps: 305000\n",
      "38.17087\n",
      "Train: Step:  1525 Val-Loss: 1.9259  Val-Acc: 0.27 Time: 8921.59 Local Steps: 306800\n",
      "37.855747\n",
      "Train: Step:  1534 Val-Loss: 1.9339  Val-Acc: 0.25 Time: 8971.99 Local Steps: 308600\n",
      "38.169743\n",
      "Train: Step:  1543 Val-Loss: 2.0222  Val-Acc: 0.23 Time: 9026.88 Local Steps: 310400\n",
      "38.637276\n",
      "Train: Step:  1553 Val-Loss: 2.0724  Val-Acc: 0.20 Time: 9078.46 Local Steps: 312400\n",
      "38.57206\n",
      "Train: Step:  1562 Val-Loss: 1.9293  Val-Acc: 0.27 Time: 9134.82 Local Steps: 314200\n",
      "37.142303\n",
      "Train: Step:  1571 Val-Loss: 1.8925  Val-Acc: 0.29 Time: 9188.19 Local Steps: 316000\n",
      "38.67695\n",
      "Train: Step:  1580 Val-Loss: 1.9224  Val-Acc: 0.26 Time: 9238.65 Local Steps: 317800\n",
      "38.42344\n",
      "Train: Step:  1590 Val-Loss: 2.0001  Val-Acc: 0.26 Time: 9297.50 Local Steps: 319800\n",
      "36.744034\n",
      "Train: Step:  1599 Val-Loss: 1.9023  Val-Acc: 0.27 Time: 9347.67 Local Steps: 321600\n",
      "37.548542\n",
      "Train: Step:  1608 Val-Loss: 1.9697  Val-Acc: 0.24 Time: 9400.18 Local Steps: 323400\n",
      "37.107533\n",
      "Train: Step:  1616 Val-Loss: 1.9953  Val-Acc: 0.24 Time: 9451.16 Local Steps: 325000\n",
      "38.488724\n",
      "Train: Step:  1625 Val-Loss: 1.9835  Val-Acc: 0.22 Time: 9503.16 Local Steps: 326800\n",
      "38.16497\n",
      "Train: Step:  1635 Val-Loss: 2.0747  Val-Acc: 0.23 Time: 9559.07 Local Steps: 328800\n",
      "37.71006\n",
      "Train: Step:  1644 Val-Loss: 1.9718  Val-Acc: 0.23 Time: 9611.92 Local Steps: 330600\n",
      "39.25559\n",
      "Train: Step:  1653 Val-Loss: 2.0324  Val-Acc: 0.19 Time: 9662.33 Local Steps: 332400\n",
      "38.382828\n",
      "Train: Step:  1661 Val-Loss: 1.9368  Val-Acc: 0.26 Time: 9712.95 Local Steps: 334000\n",
      "37.692017\n",
      "Train: Step:  1670 Val-Loss: 1.9564  Val-Acc: 0.24 Time: 9765.87 Local Steps: 335800\n",
      "37.590332\n",
      "Train: Step:  1679 Val-Loss: 1.9320  Val-Acc: 0.25 Time: 9817.66 Local Steps: 337600\n",
      "38.169296\n",
      "Train: Step:  1688 Val-Loss: 1.9680  Val-Acc: 0.25 Time: 9869.94 Local Steps: 339400\n",
      "37.220497\n",
      "Train: Step:  1697 Val-Loss: 1.9351  Val-Acc: 0.27 Time: 9921.92 Local Steps: 341200\n",
      "38.33499\n",
      "Train: Step:  1706 Val-Loss: 1.9421  Val-Acc: 0.25 Time: 9974.78 Local Steps: 343000\n",
      "37.026768\n",
      "Train: Step:  1714 Val-Loss: 1.9360  Val-Acc: 0.27 Time: 10025.59 Local Steps: 344600\n",
      "37.41153\n",
      "Train: Step:  1723 Val-Loss: 1.9475  Val-Acc: 0.25 Time: 10077.83 Local Steps: 346400\n",
      "38.356815\n",
      "Train: Step:  1733 Val-Loss: 1.9544  Val-Acc: 0.25 Time: 10133.36 Local Steps: 348400\n",
      "37.642696\n",
      "Train: Step:  1742 Val-Loss: 1.8702  Val-Acc: 0.29 Time: 10186.64 Local Steps: 350200\n",
      "38.171524\n",
      "Train: Step:  1751 Val-Loss: 1.9305  Val-Acc: 0.27 Time: 10238.41 Local Steps: 352000\n",
      "37.59569\n",
      "Train: Step:  1760 Val-Loss: 1.9458  Val-Acc: 0.27 Time: 10290.45 Local Steps: 353800\n",
      "38.06812\n",
      "Train: Step:  1769 Val-Loss: 2.0154  Val-Acc: 0.22 Time: 10342.14 Local Steps: 355600\n",
      "36.953793\n",
      "Train: Step:  1778 Val-Loss: 1.9830  Val-Acc: 0.24 Time: 10399.29 Local Steps: 357400\n",
      "37.96675\n",
      "Train: Step:  1788 Val-Loss: 1.9609  Val-Acc: 0.27 Time: 10453.61 Local Steps: 359400\n",
      "37.163044\n",
      "Train: Step:  1797 Val-Loss: 1.9706  Val-Acc: 0.21 Time: 10505.11 Local Steps: 361200\n",
      "37.11985\n",
      "Train: Step:  1806 Val-Loss: 1.9066  Val-Acc: 0.27 Time: 10557.50 Local Steps: 363000\n",
      "36.99572\n",
      "Train: Step:  1815 Val-Loss: 1.8802  Val-Acc: 0.25 Time: 10614.61 Local Steps: 364800\n",
      "37.572426\n",
      "Train: Step:  1824 Val-Loss: 1.9538  Val-Acc: 0.25 Time: 10664.98 Local Steps: 366600\n",
      "37.675446\n",
      "Train: Step:  1833 Val-Loss: 2.0049  Val-Acc: 0.18 Time: 10717.32 Local Steps: 368400\n",
      "38.34584\n",
      "Train: Step:  1842 Val-Loss: 2.0202  Val-Acc: 0.21 Time: 10769.69 Local Steps: 370200\n",
      "37.819107\n",
      "Train: Step:  1851 Val-Loss: 1.9399  Val-Acc: 0.27 Time: 10830.36 Local Steps: 372000\n",
      "37.50802\n",
      "Train: Step:  1861 Val-Loss: 1.9309  Val-Acc: 0.26 Time: 10881.13 Local Steps: 374000\n",
      "37.506573\n",
      "Train: Step:  1870 Val-Loss: 1.9672  Val-Acc: 0.24 Time: 10936.03 Local Steps: 375800\n",
      "37.082565\n",
      "Train: Step:  1879 Val-Loss: 1.9403  Val-Acc: 0.25 Time: 10990.43 Local Steps: 377600\n",
      "37.729935\n",
      "Train: Step:  1888 Val-Loss: 1.9577  Val-Acc: 0.26 Time: 11045.88 Local Steps: 379400\n",
      "37.081398\n",
      "Train: Step:  1897 Val-Loss: 1.9275  Val-Acc: 0.26 Time: 11096.16 Local Steps: 381200\n",
      "37.25057\n",
      "Train: Step:  1906 Val-Loss: 1.9069  Val-Acc: 0.27 Time: 11149.47 Local Steps: 383000\n",
      "38.404793\n",
      "Train: Step:  1915 Val-Loss: 1.9858  Val-Acc: 0.25 Time: 11202.46 Local Steps: 384800\n",
      "37.60276\n",
      "Train: Step:  1924 Val-Loss: 1.9677  Val-Acc: 0.27 Time: 11259.22 Local Steps: 386600\n",
      "37.76519\n",
      "Train: Step:  1933 Val-Loss: 2.0015  Val-Acc: 0.25 Time: 11310.33 Local Steps: 388400\n",
      "36.94118\n",
      "Train: Step:  1942 Val-Loss: 1.9091  Val-Acc: 0.28 Time: 11362.93 Local Steps: 390200\n",
      "37.600643\n",
      "Train: Step:  1951 Val-Loss: 1.9785  Val-Acc: 0.24 Time: 11415.00 Local Steps: 392000\n",
      "36.212234\n",
      "Train: Step:  1961 Val-Loss: 1.8728  Val-Acc: 0.29 Time: 11468.19 Local Steps: 394000\n",
      "38.139145\n",
      "Train: Step:  1969 Val-Loss: 1.9188  Val-Acc: 0.26 Time: 11521.99 Local Steps: 395600\n",
      "37.661545\n",
      "Train: Step:  1978 Val-Loss: 1.9968  Val-Acc: 0.26 Time: 11572.12 Local Steps: 397400\n",
      "38.24334\n",
      "Train: Step:  1986 Val-Loss: 2.0253  Val-Acc: 0.22 Time: 11622.37 Local Steps: 399000\n",
      "36.686714\n",
      "Train: Step:  1995 Val-Loss: 1.9860  Val-Acc: 0.25 Time: 11674.96 Local Steps: 400800\n",
      "36.880966\n",
      "Train: Step:  2005 Val-Loss: 1.9108  Val-Acc: 0.27 Time: 11731.31 Local Steps: 402800\n",
      "38.70329\n",
      "Train: Step:  2015 Val-Loss: 2.0572  Val-Acc: 0.21 Time: 11788.79 Local Steps: 404800\n",
      "36.557518\n",
      "Train: Step:  2023 Val-Loss: 1.8569  Val-Acc: 0.29 Time: 11840.07 Local Steps: 406400\n",
      "37.29663\n",
      "Train: Step:  2033 Val-Loss: 2.0319  Val-Acc: 0.22 Time: 11895.13 Local Steps: 408400\n",
      "37.04309\n",
      "Train: Step:  2042 Val-Loss: 1.9453  Val-Acc: 0.26 Time: 11946.21 Local Steps: 410200\n",
      "36.61104\n",
      "Train: Step:  2051 Val-Loss: 1.9257  Val-Acc: 0.25 Time: 11996.44 Local Steps: 412000\n",
      "36.78673\n",
      "Train: Step:  2060 Val-Loss: 1.9289  Val-Acc: 0.27 Time: 12047.04 Local Steps: 413800\n",
      "37.814495\n",
      "Train: Step:  2069 Val-Loss: 1.9542  Val-Acc: 0.25 Time: 12100.44 Local Steps: 415600\n",
      "37.292892\n",
      "Train: Step:  2078 Val-Loss: 2.0136  Val-Acc: 0.25 Time: 12153.02 Local Steps: 417400\n",
      "36.64689\n",
      "Train: Step:  2087 Val-Loss: 1.8742  Val-Acc: 0.27 Time: 12210.26 Local Steps: 419200\n",
      "36.43277\n",
      "Train: Step:  2096 Val-Loss: 1.9264  Val-Acc: 0.25 Time: 12262.52 Local Steps: 421000\n",
      "37.11134\n",
      "Train: Step:  2105 Val-Loss: 1.9591  Val-Acc: 0.24 Time: 12312.77 Local Steps: 422800\n",
      "36.617493\n",
      "Train: Step:  2113 Val-Loss: 1.9032  Val-Acc: 0.26 Time: 12362.80 Local Steps: 424400\n",
      "35.9821\n",
      "Train: Step:  2122 Val-Loss: 1.8923  Val-Acc: 0.31 Time: 12415.14 Local Steps: 426200\n",
      "37.635315\n",
      "Train: Step:  2132 Val-Loss: 2.0956  Val-Acc: 0.25 Time: 12472.59 Local Steps: 428200\n",
      "37.048813\n",
      "Train: Step:  2141 Val-Loss: 2.0303  Val-Acc: 0.24 Time: 12522.85 Local Steps: 430000\n",
      "35.89527\n",
      "Train: Step:  2150 Val-Loss: 1.8686  Val-Acc: 0.29 Time: 12575.98 Local Steps: 431800\n",
      "37.409416\n",
      "Train: Step:  2159 Val-Loss: 1.9897  Val-Acc: 0.24 Time: 12630.03 Local Steps: 433600\n",
      "36.06067\n",
      "Train: Step:  2169 Val-Loss: 1.9190  Val-Acc: 0.28 Time: 12683.15 Local Steps: 435600\n",
      "37.37638\n",
      "Train: Step:  2178 Val-Loss: 1.8884  Val-Acc: 0.27 Time: 12741.55 Local Steps: 437400\n",
      "36.86061\n",
      "Train: Step:  2187 Val-Loss: 1.9781  Val-Acc: 0.21 Time: 12795.90 Local Steps: 439200\n",
      "36.762726\n",
      "Train: Step:  2197 Val-Loss: 1.9263  Val-Acc: 0.26 Time: 12853.13 Local Steps: 441200\n",
      "36.31259\n",
      "Train: Step:  2206 Val-Loss: 1.9337  Val-Acc: 0.28 Time: 12903.80 Local Steps: 443000\n",
      "35.83281\n",
      "Train: Step:  2216 Val-Loss: 1.8879  Val-Acc: 0.29 Time: 12959.58 Local Steps: 445000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36.663883\n",
      "Train: Step:  2225 Val-Loss: 1.8952  Val-Acc: 0.28 Time: 13014.38 Local Steps: 446800\n",
      "38.05381\n",
      "Train: Step:  2234 Val-Loss: 1.9739  Val-Acc: 0.23 Time: 13067.76 Local Steps: 448600\n",
      "36.931664\n",
      "Train: Step:  2243 Val-Loss: 1.9126  Val-Acc: 0.24 Time: 13122.15 Local Steps: 450400\n",
      "35.624466\n",
      "Train: Step:  2252 Val-Loss: 1.9297  Val-Acc: 0.28 Time: 13175.67 Local Steps: 452200\n",
      "36.947388\n",
      "Train: Step:  2261 Val-Loss: 2.0069  Val-Acc: 0.25 Time: 13229.72 Local Steps: 454000\n",
      "36.5383\n",
      "Train: Step:  2270 Val-Loss: 1.9087  Val-Acc: 0.25 Time: 13283.85 Local Steps: 455800\n",
      "36.26165\n",
      "Train: Step:  2280 Val-Loss: 1.9343  Val-Acc: 0.25 Time: 13337.71 Local Steps: 457800\n",
      "37.5254\n",
      "Train: Step:  2289 Val-Loss: 1.9202  Val-Acc: 0.28 Time: 13392.91 Local Steps: 459600\n",
      "35.523663\n",
      "Train: Step:  2299 Val-Loss: 1.8543  Val-Acc: 0.31 Time: 13446.16 Local Steps: 461600\n",
      "37.051476\n",
      "Train: Step:  2308 Val-Loss: 1.9329  Val-Acc: 0.25 Time: 13499.61 Local Steps: 463400\n",
      "35.970367\n",
      "Train: Step:  2317 Val-Loss: 1.8760  Val-Acc: 0.29 Time: 13552.19 Local Steps: 465200\n",
      "37.08838\n",
      "Train: Step:  2326 Val-Loss: 1.9759  Val-Acc: 0.26 Time: 13608.95 Local Steps: 467000\n",
      "35.973095\n",
      "Train: Step:  2335 Val-Loss: 1.9131  Val-Acc: 0.26 Time: 13660.08 Local Steps: 468800\n",
      "35.48503\n",
      "Train: Step:  2345 Val-Loss: 1.9079  Val-Acc: 0.26 Time: 13716.62 Local Steps: 470800\n",
      "37.299194\n",
      "Train: Step:  2354 Val-Loss: 1.9376  Val-Acc: 0.25 Time: 13770.04 Local Steps: 472600\n",
      "38.101597\n",
      "Train: Step:  2363 Val-Loss: 1.9866  Val-Acc: 0.21 Time: 13822.18 Local Steps: 474400\n",
      "36.58397\n",
      "Train: Step:  2372 Val-Loss: 1.9366  Val-Acc: 0.21 Time: 13874.48 Local Steps: 476200\n",
      "37.587402\n",
      "Train: Step:  2381 Val-Loss: 2.0758  Val-Acc: 0.14 Time: 13928.75 Local Steps: 478000\n",
      "35.845413\n",
      "Train: Step:  2390 Val-Loss: 1.9102  Val-Acc: 0.26 Time: 13980.14 Local Steps: 479800\n",
      "36.263702\n",
      "Train: Step:  2399 Val-Loss: 1.9148  Val-Acc: 0.27 Time: 14031.50 Local Steps: 481600\n",
      "36.534016\n",
      "Train: Step:  2407 Val-Loss: 1.9205  Val-Acc: 0.23 Time: 14084.23 Local Steps: 483200\n",
      "35.9529\n",
      "Train: Step:  2417 Val-Loss: 1.8878  Val-Acc: 0.28 Time: 14139.68 Local Steps: 485200\n",
      "36.750664\n",
      "Train: Step:  2425 Val-Loss: 1.9381  Val-Acc: 0.26 Time: 14190.62 Local Steps: 486800\n",
      "37.964695\n",
      "Train: Step:  2434 Val-Loss: 1.9592  Val-Acc: 0.22 Time: 14241.75 Local Steps: 488600\n",
      "36.35576\n",
      "Train: Step:  2443 Val-Loss: 2.0083  Val-Acc: 0.24 Time: 14292.77 Local Steps: 490400\n",
      "36.860126\n",
      "Train: Step:  2452 Val-Loss: 2.0148  Val-Acc: 0.23 Time: 14345.38 Local Steps: 492200\n",
      "36.14509\n",
      "Train: Step:  2461 Val-Loss: 1.8654  Val-Acc: 0.28 Time: 14402.30 Local Steps: 494000\n",
      "37.742012\n",
      "Train: Step:  2471 Val-Loss: 1.9707  Val-Acc: 0.24 Time: 14454.67 Local Steps: 496000\n",
      "36.58567\n",
      "Train: Step:  2480 Val-Loss: 1.9645  Val-Acc: 0.28 Time: 14508.56 Local Steps: 497800\n",
      "35.740486\n",
      "Train: Step:  2490 Val-Loss: 1.9278  Val-Acc: 0.28 Time: 14563.66 Local Steps: 499800\n",
      "35.72534\n",
      "Train: Step:  2499 Val-Loss: 1.9040  Val-Acc: 0.27 Time: 14616.93 Local Steps: 501600\n",
      "36.053883\n",
      "Train: Step:  2508 Val-Loss: 1.8904  Val-Acc: 0.28 Time: 14668.95 Local Steps: 503400\n",
      "36.36855\n",
      "Train: Step:  2517 Val-Loss: 1.9300  Val-Acc: 0.27 Time: 14725.86 Local Steps: 505200\n",
      "35.498425\n",
      "Train: Step:  2527 Val-Loss: 1.8760  Val-Acc: 0.27 Time: 14780.86 Local Steps: 507200\n",
      "35.64151\n",
      "Train: Step:  2536 Val-Loss: 1.8828  Val-Acc: 0.30 Time: 14833.35 Local Steps: 509000\n",
      "37.750786\n",
      "Train: Step:  2545 Val-Loss: 1.9666  Val-Acc: 0.28 Time: 14884.03 Local Steps: 510800\n",
      "35.820587\n",
      "Train: Step:  2554 Val-Loss: 1.9041  Val-Acc: 0.30 Time: 14938.11 Local Steps: 512600\n",
      "36.065582\n",
      "Train: Step:  2562 Val-Loss: 1.9193  Val-Acc: 0.29 Time: 14988.51 Local Steps: 514200\n",
      "36.166534\n",
      "Train: Step:  2572 Val-Loss: 1.9458  Val-Acc: 0.26 Time: 15044.56 Local Steps: 516200\n",
      "35.18029\n",
      "Train: Step:  2581 Val-Loss: 1.8487  Val-Acc: 0.30 Time: 15095.51 Local Steps: 518000\n",
      "36.070953\n",
      "Train: Step:  2591 Val-Loss: 1.9434  Val-Acc: 0.26 Time: 15150.42 Local Steps: 520000\n",
      "37.8219\n",
      "Train: Step:  2599 Val-Loss: 2.0600  Val-Acc: 0.20 Time: 15201.76 Local Steps: 521600\n",
      "36.124786\n",
      "Train: Step:  2608 Val-Loss: 1.9440  Val-Acc: 0.27 Time: 15253.93 Local Steps: 523400\n",
      "35.39966\n",
      "Train: Step:  2618 Val-Loss: 1.9579  Val-Acc: 0.27 Time: 15312.91 Local Steps: 525400\n",
      "36.08258\n",
      "Train: Step:  2627 Val-Loss: 1.9274  Val-Acc: 0.27 Time: 15364.76 Local Steps: 527200\n",
      "36.68299\n",
      "Train: Step:  2636 Val-Loss: 1.9816  Val-Acc: 0.25 Time: 15417.78 Local Steps: 529000\n",
      "35.667343\n",
      "Train: Step:  2646 Val-Loss: 1.9543  Val-Acc: 0.24 Time: 15472.82 Local Steps: 531000\n",
      "35.625015\n",
      "Train: Step:  2655 Val-Loss: 2.0008  Val-Acc: 0.22 Time: 15528.00 Local Steps: 532800\n",
      "36.147068\n",
      "Train: Step:  2664 Val-Loss: 2.0176  Val-Acc: 0.24 Time: 15582.26 Local Steps: 534600\n",
      "35.884575\n",
      "Train: Step:  2673 Val-Loss: 1.9512  Val-Acc: 0.24 Time: 15634.59 Local Steps: 536400\n",
      "35.412697\n",
      "Train: Step:  2683 Val-Loss: 1.9139  Val-Acc: 0.24 Time: 15692.17 Local Steps: 538400\n",
      "36.69156\n",
      "Train: Step:  2692 Val-Loss: 2.0736  Val-Acc: 0.24 Time: 15746.73 Local Steps: 540200\n",
      "36.09169\n",
      "Train: Step:  2702 Val-Loss: 1.9518  Val-Acc: 0.28 Time: 15802.80 Local Steps: 542200\n",
      "36.749428\n",
      "Train: Step:  2711 Val-Loss: 1.9828  Val-Acc: 0.23 Time: 15853.98 Local Steps: 544000\n",
      "35.36039\n",
      "Train: Step:  2720 Val-Loss: 1.8704  Val-Acc: 0.27 Time: 15905.81 Local Steps: 545800\n",
      "36.109577\n",
      "Train: Step:  2730 Val-Loss: 1.9586  Val-Acc: 0.28 Time: 15963.08 Local Steps: 547800\n",
      "34.901466\n",
      "Train: Step:  2740 Val-Loss: 1.9070  Val-Acc: 0.30 Time: 16018.75 Local Steps: 549800\n",
      "34.70155\n",
      "Train: Step:  2749 Val-Loss: 1.8783  Val-Acc: 0.31 Time: 16072.38 Local Steps: 551600\n",
      "36.648945\n",
      "Train: Step:  2758 Val-Loss: 1.9313  Val-Acc: 0.27 Time: 16123.36 Local Steps: 553400\n",
      "35.387\n",
      "Train: Step:  2766 Val-Loss: 1.8957  Val-Acc: 0.28 Time: 16174.54 Local Steps: 555000\n",
      "35.389366\n",
      "Train: Step:  2776 Val-Loss: 1.9233  Val-Acc: 0.24 Time: 16231.89 Local Steps: 557000\n",
      "35.02645\n",
      "Train: Step:  2785 Val-Loss: 1.9396  Val-Acc: 0.27 Time: 16282.23 Local Steps: 558800\n",
      "35.860027\n",
      "Train: Step:  2794 Val-Loss: 1.9302  Val-Acc: 0.28 Time: 16334.89 Local Steps: 560600\n",
      "35.066944\n",
      "Train: Step:  2803 Val-Loss: 1.8773  Val-Acc: 0.31 Time: 16388.88 Local Steps: 562400\n",
      "35.11931\n",
      "Train: Step:  2813 Val-Loss: 1.9715  Val-Acc: 0.26 Time: 16443.65 Local Steps: 564400\n",
      "35.623657\n",
      "Train: Step:  2822 Val-Loss: 1.9632  Val-Acc: 0.25 Time: 16495.08 Local Steps: 566200\n",
      "34.71399\n",
      "Train: Step:  2831 Val-Loss: 1.8698  Val-Acc: 0.29 Time: 16549.57 Local Steps: 568000\n",
      "34.682503\n",
      "Train: Step:  2840 Val-Loss: 1.9369  Val-Acc: 0.27 Time: 16599.79 Local Steps: 569800\n",
      "35.49442\n",
      "Train: Step:  2848 Val-Loss: 1.9757  Val-Acc: 0.24 Time: 16651.89 Local Steps: 571400\n",
      "36.099155\n",
      "Train: Step:  2857 Val-Loss: 1.9354  Val-Acc: 0.27 Time: 16703.32 Local Steps: 573200\n",
      "35.831753\n",
      "Train: Step:  2867 Val-Loss: 1.9829  Val-Acc: 0.22 Time: 16756.72 Local Steps: 575200\n",
      "35.568893\n",
      "Train: Step:  2877 Val-Loss: 1.9876  Val-Acc: 0.26 Time: 16815.81 Local Steps: 577200\n",
      "35.075184\n",
      "Train: Step:  2886 Val-Loss: 1.8540  Val-Acc: 0.31 Time: 16871.21 Local Steps: 579000\n",
      "36.498585\n",
      "Train: Step:  2895 Val-Loss: 1.9774  Val-Acc: 0.27 Time: 16923.43 Local Steps: 580800\n",
      "35.2917\n",
      "Train: Step:  2904 Val-Loss: 1.8768  Val-Acc: 0.28 Time: 16975.96 Local Steps: 582600\n",
      "36.557976\n",
      "Train: Step:  2912 Val-Loss: 1.8699  Val-Acc: 0.30 Time: 17026.88 Local Steps: 584200\n",
      "35.084244\n",
      "Train: Step:  2921 Val-Loss: 1.9022  Val-Acc: 0.27 Time: 17078.29 Local Steps: 586000\n",
      "34.83657\n",
      "Train: Step:  2930 Val-Loss: 1.8801  Val-Acc: 0.26 Time: 17130.34 Local Steps: 587800\n",
      "35.27662\n",
      "Train: Step:  2939 Val-Loss: 1.8925  Val-Acc: 0.30 Time: 17184.33 Local Steps: 589600\n",
      "34.859722\n",
      "Train: Step:  2948 Val-Loss: 1.9157  Val-Acc: 0.27 Time: 17236.74 Local Steps: 591400\n",
      "35.148132\n",
      "Train: Step:  2957 Val-Loss: 1.8868  Val-Acc: 0.28 Time: 17291.95 Local Steps: 593200\n",
      "34.58284\n",
      "Train: Step:  2966 Val-Loss: 1.8731  Val-Acc: 0.30 Time: 17343.11 Local Steps: 595000\n",
      "36.080708\n",
      "Train: Step:  2975 Val-Loss: 1.9243  Val-Acc: 0.25 Time: 17394.35 Local Steps: 596800\n",
      "35.276505\n",
      "Train: Step:  2984 Val-Loss: 1.8880  Val-Acc: 0.29 Time: 17450.29 Local Steps: 598600\n",
      "35.107452\n",
      "Train: Step:  2994 Val-Loss: 1.8284  Val-Acc: 0.30 Time: 17503.38 Local Steps: 600600\n",
      "35.43998\n",
      "Train: Step:  3003 Val-Loss: 1.9670  Val-Acc: 0.23 Time: 17556.23 Local Steps: 602400\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "34.919777\n",
      "Train: Step:  3011 Val-Loss: 1.9324  Val-Acc: 0.21 Time: 17606.87 Local Steps: 604000\n",
      "35.566757\n",
      "Train: Step:  3021 Val-Loss: 1.9198  Val-Acc: 0.27 Time: 17657.86 Local Steps: 606000\n",
      "36.063965\n",
      "Train: Step:  3031 Val-Loss: 2.0990  Val-Acc: 0.22 Time: 17714.68 Local Steps: 608000\n",
      "34.71428\n",
      "Train: Step:  3041 Val-Loss: 1.9240  Val-Acc: 0.25 Time: 17769.15 Local Steps: 610000\n",
      "35.98568\n",
      "Train: Step:  3050 Val-Loss: 1.8674  Val-Acc: 0.28 Time: 17824.47 Local Steps: 611800\n",
      "35.010098\n",
      "Train: Step:  3059 Val-Loss: 1.8943  Val-Acc: 0.29 Time: 17879.35 Local Steps: 613600\n",
      "34.909576\n",
      "Train: Step:  3068 Val-Loss: 1.9141  Val-Acc: 0.28 Time: 17935.79 Local Steps: 615400\n",
      "35.00322\n",
      "Train: Step:  3078 Val-Loss: 1.9746  Val-Acc: 0.26 Time: 17991.45 Local Steps: 617400\n",
      "35.015614\n",
      "Train: Step:  3088 Val-Loss: 1.8763  Val-Acc: 0.29 Time: 18048.76 Local Steps: 619400\n",
      "34.55665\n",
      "Train: Step:  3097 Val-Loss: 1.9153  Val-Acc: 0.32 Time: 18102.38 Local Steps: 621200\n",
      "35.890686\n",
      "Train: Step:  3106 Val-Loss: 1.8854  Val-Acc: 0.27 Time: 18152.89 Local Steps: 623000\n",
      "35.212433\n",
      "Train: Step:  3115 Val-Loss: 1.8865  Val-Acc: 0.29 Time: 18204.99 Local Steps: 624800\n",
      "34.628426\n",
      "Train: Step:  3124 Val-Loss: 1.8428  Val-Acc: 0.31 Time: 18257.52 Local Steps: 626600\n",
      "35.101974\n",
      "Train: Step:  3133 Val-Loss: 1.9003  Val-Acc: 0.27 Time: 18316.14 Local Steps: 628400\n",
      "35.442528\n",
      "Train: Step:  3143 Val-Loss: 1.8932  Val-Acc: 0.28 Time: 18371.07 Local Steps: 630400\n",
      "33.982018\n",
      "Train: Step:  3153 Val-Loss: 1.8271  Val-Acc: 0.32 Time: 18426.57 Local Steps: 632400\n",
      "35.335693\n",
      "Train: Step:  3162 Val-Loss: 1.8915  Val-Acc: 0.33 Time: 18477.87 Local Steps: 634200\n",
      "34.94368\n",
      "Train: Step:  3171 Val-Loss: 1.8642  Val-Acc: 0.31 Time: 18531.82 Local Steps: 636000\n",
      "34.628082\n",
      "Train: Step:  3180 Val-Loss: 1.8683  Val-Acc: 0.33 Time: 18584.25 Local Steps: 637800\n",
      "34.14852\n",
      "Train: Step:  3189 Val-Loss: 1.8357  Val-Acc: 0.32 Time: 18638.58 Local Steps: 639600\n",
      "34.855804\n",
      "Train: Step:  3197 Val-Loss: 1.8934  Val-Acc: 0.29 Time: 18689.51 Local Steps: 641200\n",
      "35.432266\n",
      "Train: Step:  3206 Val-Loss: 1.8808  Val-Acc: 0.26 Time: 18743.57 Local Steps: 643000\n",
      "34.573242\n",
      "Train: Step:  3216 Val-Loss: 1.8622  Val-Acc: 0.30 Time: 18795.95 Local Steps: 645000\n",
      "35.143745\n",
      "Train: Step:  3226 Val-Loss: 1.9857  Val-Acc: 0.23 Time: 18857.22 Local Steps: 647000\n",
      "34.599102\n",
      "Train: Step:  3235 Val-Loss: 1.9002  Val-Acc: 0.29 Time: 18908.19 Local Steps: 648800\n",
      "34.181828\n",
      "Train: Step:  3244 Val-Loss: 1.8756  Val-Acc: 0.28 Time: 18961.52 Local Steps: 650600\n",
      "34.52715\n",
      "Train: Step:  3253 Val-Loss: 1.9149  Val-Acc: 0.28 Time: 19018.97 Local Steps: 652400\n",
      "34.25444\n",
      "Train: Step:  3262 Val-Loss: 1.8162  Val-Acc: 0.34 Time: 19069.49 Local Steps: 654200\n",
      "34.2758\n",
      "Train: Step:  3271 Val-Loss: 1.8599  Val-Acc: 0.29 Time: 19121.96 Local Steps: 656000\n",
      "34.339638\n",
      "Train: Step:  3280 Val-Loss: 1.9427  Val-Acc: 0.27 Time: 19174.20 Local Steps: 657800\n",
      "34.830246\n",
      "Train: Step:  3290 Val-Loss: 1.9728  Val-Acc: 0.26 Time: 19229.66 Local Steps: 659800\n",
      "34.57087\n",
      "Train: Step:  3298 Val-Loss: 1.9421  Val-Acc: 0.30 Time: 19281.46 Local Steps: 661400\n",
      "35.348316\n",
      "Train: Step:  3308 Val-Loss: 1.9135  Val-Acc: 0.28 Time: 19336.33 Local Steps: 663400\n",
      "34.529953\n",
      "Train: Step:  3317 Val-Loss: 1.9091  Val-Acc: 0.30 Time: 19392.34 Local Steps: 665200\n",
      "35.27658\n",
      "Train: Step:  3326 Val-Loss: 1.9530  Val-Acc: 0.24 Time: 19443.35 Local Steps: 667000\n",
      "33.997574\n",
      "Train: Step:  3335 Val-Loss: 1.8020  Val-Acc: 0.30 Time: 19493.98 Local Steps: 668800\n",
      "33.874985\n",
      "Train: Step:  3344 Val-Loss: 1.8413  Val-Acc: 0.29 Time: 19546.79 Local Steps: 670600\n",
      "34.29619\n",
      "Train: Step:  3353 Val-Loss: 1.8624  Val-Acc: 0.31 Time: 19603.16 Local Steps: 672400\n",
      "35.15158\n",
      "Train: Step:  3362 Val-Loss: 1.9644  Val-Acc: 0.25 Time: 19653.57 Local Steps: 674200\n",
      "34.94902\n",
      "Train: Step:  3371 Val-Loss: 1.9050  Val-Acc: 0.24 Time: 19708.17 Local Steps: 676000\n",
      "34.154633\n",
      "Train: Step:  3380 Val-Loss: 1.9763  Val-Acc: 0.29 Time: 19759.33 Local Steps: 677800\n",
      "34.187263\n",
      "Train: Step:  3389 Val-Loss: 1.9681  Val-Acc: 0.26 Time: 19812.62 Local Steps: 679600\n",
      "34.550213\n",
      "Train: Step:  3398 Val-Loss: 1.8872  Val-Acc: 0.27 Time: 19869.01 Local Steps: 681400\n",
      "33.867558\n",
      "Train: Step:  3408 Val-Loss: 1.8329  Val-Acc: 0.29 Time: 19928.74 Local Steps: 683400\n",
      "36.45069\n",
      "Train: Step:  3418 Val-Loss: 2.0088  Val-Acc: 0.28 Time: 19981.92 Local Steps: 685400\n",
      "35.20854\n",
      "Train: Step:  3427 Val-Loss: 1.9499  Val-Acc: 0.24 Time: 20037.31 Local Steps: 687200\n",
      "35.032917\n",
      "Train: Step:  3436 Val-Loss: 1.9368  Val-Acc: 0.27 Time: 20087.35 Local Steps: 689000\n",
      "34.94327\n",
      "Train: Step:  3445 Val-Loss: 1.9929  Val-Acc: 0.24 Time: 20139.26 Local Steps: 690800\n",
      "34.07041\n",
      "Train: Step:  3454 Val-Loss: 1.8515  Val-Acc: 0.31 Time: 20190.52 Local Steps: 692600\n",
      "34.37266\n",
      "Train: Step:  3463 Val-Loss: 1.9508  Val-Acc: 0.20 Time: 20247.47 Local Steps: 694400\n",
      "34.80345\n",
      "Train: Step:  3472 Val-Loss: 1.8882  Val-Acc: 0.26 Time: 20298.42 Local Steps: 696200\n",
      "34.04444\n",
      "Train: Step:  3482 Val-Loss: 1.8766  Val-Acc: 0.29 Time: 20352.27 Local Steps: 698200\n",
      "34.495655\n",
      "Train: Step:  3491 Val-Loss: 1.9402  Val-Acc: 0.26 Time: 20403.90 Local Steps: 700000\n",
      "34.665073\n",
      "Train: Step:  3500 Val-Loss: 1.9839  Val-Acc: 0.25 Time: 20456.47 Local Steps: 701800\n",
      "35.120575\n",
      "Train: Step:  3509 Val-Loss: 1.8834  Val-Acc: 0.27 Time: 20508.03 Local Steps: 703600\n",
      "34.417767\n",
      "Train: Step:  3518 Val-Loss: 1.8577  Val-Acc: 0.28 Time: 20559.18 Local Steps: 705400\n",
      "34.76117\n",
      "Train: Step:  3527 Val-Loss: 1.8862  Val-Acc: 0.29 Time: 20609.97 Local Steps: 707200\n",
      "34.209797\n",
      "Train: Step:  3536 Val-Loss: 1.9314  Val-Acc: 0.27 Time: 20662.40 Local Steps: 709000\n",
      "33.919495\n",
      "Train: Step:  3545 Val-Loss: 1.9193  Val-Acc: 0.28 Time: 20719.25 Local Steps: 710800\n",
      "33.721443\n",
      "Train: Step:  3554 Val-Loss: 1.9084  Val-Acc: 0.26 Time: 20771.09 Local Steps: 712600\n",
      "34.635162\n",
      "Train: Step:  3563 Val-Loss: 1.9155  Val-Acc: 0.29 Time: 20821.42 Local Steps: 714400\n",
      "34.310303\n",
      "Train: Step:  3572 Val-Loss: 1.8661  Val-Acc: 0.26 Time: 20875.09 Local Steps: 716200\n",
      "34.383133\n",
      "Train: Step:  3581 Val-Loss: 1.9238  Val-Acc: 0.27 Time: 20927.08 Local Steps: 718000\n",
      "33.798195\n",
      "Train: Step:  3589 Val-Loss: 1.8296  Val-Acc: 0.31 Time: 20978.00 Local Steps: 719600\n",
      "34.238014\n",
      "Train: Step:  3598 Val-Loss: 1.9476  Val-Acc: 0.27 Time: 21028.99 Local Steps: 721400\n",
      "34.0104\n",
      "Train: Step:  3607 Val-Loss: 1.8623  Val-Acc: 0.30 Time: 21081.14 Local Steps: 723200\n",
      "33.90757\n",
      "Train: Step:  3616 Val-Loss: 1.9072  Val-Acc: 0.27 Time: 21132.21 Local Steps: 725000\n",
      "34.50242\n",
      "Train: Step:  3625 Val-Loss: 1.8371  Val-Acc: 0.30 Time: 21184.71 Local Steps: 726800\n",
      "33.79287\n",
      "Train: Step:  3634 Val-Loss: 1.8862  Val-Acc: 0.29 Time: 21237.41 Local Steps: 728600\n",
      "35.072952\n",
      "Train: Step:  3643 Val-Loss: 1.9228  Val-Acc: 0.25 Time: 21291.38 Local Steps: 730400\n",
      "34.49685\n",
      "Train: Step:  3652 Val-Loss: 1.9760  Val-Acc: 0.24 Time: 21342.65 Local Steps: 732200\n",
      "33.683968\n",
      "Train: Step:  3661 Val-Loss: 1.8304  Val-Acc: 0.30 Time: 21394.33 Local Steps: 734000\n",
      "33.3127\n",
      "Train: Step:  3670 Val-Loss: 1.8390  Val-Acc: 0.32 Time: 21447.04 Local Steps: 735800\n",
      "34.524643\n",
      "Train: Step:  3679 Val-Loss: 1.9358  Val-Acc: 0.26 Time: 21500.27 Local Steps: 737600\n",
      "33.377426\n",
      "Train: Step:  3688 Val-Loss: 1.8046  Val-Acc: 0.34 Time: 21554.03 Local Steps: 739400\n",
      "33.713768\n",
      "Train: Step:  3697 Val-Loss: 1.8562  Val-Acc: 0.29 Time: 21605.43 Local Steps: 741200\n",
      "33.67908\n",
      "Train: Step:  3706 Val-Loss: 1.8989  Val-Acc: 0.30 Time: 21659.66 Local Steps: 743000\n",
      "33.675644\n",
      "Train: Step:  3715 Val-Loss: 1.8919  Val-Acc: 0.27 Time: 21711.06 Local Steps: 744800\n",
      "34.412354\n",
      "Train: Step:  3724 Val-Loss: 1.9587  Val-Acc: 0.25 Time: 21764.35 Local Steps: 746600\n",
      "34.67502\n",
      "Train: Step:  3733 Val-Loss: 1.8517  Val-Acc: 0.32 Time: 21816.42 Local Steps: 748400\n",
      "33.489277\n",
      "Train: Step:  3742 Val-Loss: 1.8852  Val-Acc: 0.26 Time: 21869.42 Local Steps: 750200\n",
      "33.848335\n",
      "Train: Step:  3751 Val-Loss: 1.8657  Val-Acc: 0.27 Time: 21922.82 Local Steps: 752000\n",
      "34.610977\n",
      "Train: Step:  3760 Val-Loss: 1.8520  Val-Acc: 0.33 Time: 21978.14 Local Steps: 753800\n",
      "33.33931\n",
      "Train: Step:  3770 Val-Loss: 1.8611  Val-Acc: 0.28 Time: 22034.21 Local Steps: 755800\n",
      "34.26487\n",
      "Train: Step:  3780 Val-Loss: 2.0014  Val-Acc: 0.26 Time: 22088.56 Local Steps: 757800\n",
      "33.869656\n",
      "Train: Step:  3789 Val-Loss: 1.9503  Val-Acc: 0.22 Time: 22142.18 Local Steps: 759600\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "34.387268\n",
      "Train: Step:  3798 Val-Loss: 1.9501  Val-Acc: 0.24 Time: 22192.83 Local Steps: 761400\n",
      "33.88668\n",
      "Train: Step:  3806 Val-Loss: 1.8941  Val-Acc: 0.26 Time: 22243.31 Local Steps: 763000\n",
      "34.465977\n",
      "Train: Step:  3816 Val-Loss: 1.9115  Val-Acc: 0.31 Time: 22297.91 Local Steps: 765000\n",
      "33.795044\n",
      "Train: Step:  3825 Val-Loss: 1.9100  Val-Acc: 0.25 Time: 22353.15 Local Steps: 766800\n",
      "33.551918\n",
      "Train: Step:  3834 Val-Loss: 1.8364  Val-Acc: 0.31 Time: 22411.19 Local Steps: 768600\n",
      "33.986404\n",
      "Train: Step:  3843 Val-Loss: 1.8957  Val-Acc: 0.28 Time: 22462.59 Local Steps: 770400\n",
      "34.03901\n",
      "Train: Step:  3852 Val-Loss: 1.9396  Val-Acc: 0.27 Time: 22514.74 Local Steps: 772200\n",
      "34.377518\n",
      "Train: Step:  3860 Val-Loss: 1.9271  Val-Acc: 0.23 Time: 22566.93 Local Steps: 773800\n",
      "34.66175\n",
      "Train: Step:  3869 Val-Loss: 1.9656  Val-Acc: 0.23 Time: 22618.40 Local Steps: 775600\n",
      "35.143547\n",
      "Train: Step:  3878 Val-Loss: 1.9565  Val-Acc: 0.30 Time: 22670.05 Local Steps: 777400\n",
      "33.408085\n",
      "Train: Step:  3887 Val-Loss: 1.8535  Val-Acc: 0.30 Time: 22721.38 Local Steps: 779200\n",
      "33.947727\n",
      "Train: Step:  3895 Val-Loss: 1.9901  Val-Acc: 0.21 Time: 22773.55 Local Steps: 780800\n",
      "33.7834\n",
      "Train: Step:  3904 Val-Loss: 1.8848  Val-Acc: 0.29 Time: 22824.86 Local Steps: 782600\n",
      "34.25357\n",
      "Train: Step:  3913 Val-Loss: 1.8914  Val-Acc: 0.24 Time: 22878.40 Local Steps: 784400\n",
      "34.211365\n",
      "Train: Step:  3922 Val-Loss: 1.9964  Val-Acc: 0.25 Time: 22931.17 Local Steps: 786200\n",
      "34.983696\n",
      "Train: Step:  3932 Val-Loss: 1.9428  Val-Acc: 0.22 Time: 22984.50 Local Steps: 788200\n",
      "33.52763\n",
      "Train: Step:  3941 Val-Loss: 1.8599  Val-Acc: 0.32 Time: 23038.32 Local Steps: 790000\n",
      "33.09035\n",
      "Train: Step:  3950 Val-Loss: 1.7922  Val-Acc: 0.33 Time: 23091.61 Local Steps: 791800\n",
      "34.048244\n",
      "Train: Step:  3959 Val-Loss: 1.9293  Val-Acc: 0.25 Time: 23147.23 Local Steps: 793600\n",
      "34.044594\n",
      "Train: Step:  3968 Val-Loss: 1.8719  Val-Acc: 0.28 Time: 23199.30 Local Steps: 795400\n",
      "33.752434\n",
      "Train: Step:  3978 Val-Loss: 1.9184  Val-Acc: 0.30 Time: 23253.31 Local Steps: 797400\n",
      "33.75347\n",
      "Train: Step:  3987 Val-Loss: 1.8802  Val-Acc: 0.30 Time: 23309.23 Local Steps: 799200\n",
      "33.53516\n",
      "Train: Step:  3996 Val-Loss: 1.9126  Val-Acc: 0.29 Time: 23359.98 Local Steps: 801000\n",
      "33.408188\n",
      "Train: Step:  4005 Val-Loss: 1.8936  Val-Acc: 0.31 Time: 23416.40 Local Steps: 802800\n",
      "33.21196\n",
      "Train: Step:  4014 Val-Loss: 1.8412  Val-Acc: 0.32 Time: 23468.03 Local Steps: 804600\n",
      "33.64368\n",
      "Train: Step:  4023 Val-Loss: 1.8925  Val-Acc: 0.29 Time: 23518.53 Local Steps: 806400\n",
      "33.805473\n",
      "Train: Step:  4033 Val-Loss: 1.9953  Val-Acc: 0.23 Time: 23574.84 Local Steps: 808400\n",
      "34.14477\n",
      "Train: Step:  4041 Val-Loss: 1.8871  Val-Acc: 0.28 Time: 23626.63 Local Steps: 810000\n",
      "33.644917\n",
      "Train: Step:  4051 Val-Loss: 1.9087  Val-Acc: 0.28 Time: 23683.89 Local Steps: 812000\n",
      "34.57753\n",
      "Train: Step:  4060 Val-Loss: 1.9730  Val-Acc: 0.21 Time: 23738.13 Local Steps: 813800\n",
      "34.529915\n",
      "Train: Step:  4069 Val-Loss: 1.9103  Val-Acc: 0.24 Time: 23790.08 Local Steps: 815600\n",
      "36.159637\n",
      "Train: Step:  4079 Val-Loss: 2.1697  Val-Acc: 0.24 Time: 23847.26 Local Steps: 817600\n",
      "34.26201\n",
      "Train: Step:  4089 Val-Loss: 1.9423  Val-Acc: 0.24 Time: 23900.97 Local Steps: 819600\n",
      "33.938164\n",
      "Train: Step:  4099 Val-Loss: 1.9166  Val-Acc: 0.29 Time: 23951.76 Local Steps: 821600\n",
      "33.088673\n",
      "Train: Step:  4108 Val-Loss: 1.8778  Val-Acc: 0.30 Time: 24008.22 Local Steps: 823400\n",
      "33.55789\n",
      "Train: Step:  4117 Val-Loss: 1.8875  Val-Acc: 0.30 Time: 24059.09 Local Steps: 825200\n",
      "33.587288\n",
      "Train: Step:  4126 Val-Loss: 1.8968  Val-Acc: 0.29 Time: 24117.35 Local Steps: 827000\n",
      "34.162285\n",
      "Train: Step:  4135 Val-Loss: 1.9604  Val-Acc: 0.27 Time: 24171.93 Local Steps: 828800\n",
      "33.836662\n",
      "Train: Step:  4145 Val-Loss: 1.9039  Val-Acc: 0.28 Time: 24228.70 Local Steps: 830800\n",
      "33.205048\n",
      "Train: Step:  4155 Val-Loss: 1.8722  Val-Acc: 0.30 Time: 24279.83 Local Steps: 832800\n",
      "33.153194\n",
      "Train: Step:  4164 Val-Loss: 1.8318  Val-Acc: 0.32 Time: 24335.99 Local Steps: 834600\n",
      "32.834133\n",
      "Train: Step:  4173 Val-Loss: 1.9066  Val-Acc: 0.31 Time: 24388.61 Local Steps: 836400\n",
      "33.869724\n",
      "Train: Step:  4182 Val-Loss: 2.0098  Val-Acc: 0.24 Time: 24439.21 Local Steps: 838200\n",
      "32.763535\n",
      "Train: Step:  4191 Val-Loss: 1.8381  Val-Acc: 0.29 Time: 24492.49 Local Steps: 840000\n",
      "32.961643\n",
      "Train: Step:  4200 Val-Loss: 1.8442  Val-Acc: 0.33 Time: 24542.59 Local Steps: 841800\n",
      "33.024582\n",
      "Train: Step:  4209 Val-Loss: 1.8918  Val-Acc: 0.30 Time: 24597.53 Local Steps: 843600\n",
      "33.01044\n",
      "Train: Step:  4218 Val-Loss: 1.8734  Val-Acc: 0.30 Time: 24649.41 Local Steps: 845400\n",
      "33.0905\n",
      "Train: Step:  4228 Val-Loss: 1.9576  Val-Acc: 0.27 Time: 24704.76 Local Steps: 847400\n",
      "33.649162\n",
      "Train: Step:  4237 Val-Loss: 1.8591  Val-Acc: 0.31 Time: 24757.71 Local Steps: 849200\n",
      "33.403534\n",
      "Train: Step:  4246 Val-Loss: 1.9176  Val-Acc: 0.29 Time: 24811.71 Local Steps: 851000\n",
      "33.04064\n",
      "Train: Step:  4255 Val-Loss: 1.8739  Val-Acc: 0.27 Time: 24864.77 Local Steps: 852800\n",
      "33.988808\n",
      "Train: Step:  4264 Val-Loss: 1.8983  Val-Acc: 0.28 Time: 24915.83 Local Steps: 854600\n",
      "33.027023\n",
      "Train: Step:  4273 Val-Loss: 1.8469  Val-Acc: 0.29 Time: 24968.40 Local Steps: 856400\n",
      "32.648617\n",
      "Train: Step:  4282 Val-Loss: 1.8729  Val-Acc: 0.32 Time: 25021.79 Local Steps: 858200\n",
      "33.21089\n",
      "Train: Step:  4292 Val-Loss: 1.8378  Val-Acc: 0.28 Time: 25077.40 Local Steps: 860200\n",
      "32.861298\n",
      "Train: Step:  4301 Val-Loss: 1.8423  Val-Acc: 0.31 Time: 25131.49 Local Steps: 862000\n",
      "33.279346\n",
      "Train: Step:  4310 Val-Loss: 2.0339  Val-Acc: 0.23 Time: 25184.59 Local Steps: 863800\n",
      "33.558487\n",
      "Train: Step:  4319 Val-Loss: 1.9282  Val-Acc: 0.26 Time: 25239.72 Local Steps: 865600\n",
      "32.38861\n",
      "Train: Step:  4328 Val-Loss: 1.8169  Val-Acc: 0.33 Time: 25291.41 Local Steps: 867400\n",
      "33.448555\n",
      "Train: Step:  4337 Val-Loss: 1.8701  Val-Acc: 0.32 Time: 25345.82 Local Steps: 869200\n",
      "33.846508\n",
      "Train: Step:  4347 Val-Loss: 1.9963  Val-Acc: 0.22 Time: 25401.45 Local Steps: 871200\n",
      "34.569626\n",
      "Train: Step:  4356 Val-Loss: 1.9346  Val-Acc: 0.24 Time: 25451.72 Local Steps: 873000\n",
      "33.93894\n",
      "Train: Step:  4365 Val-Loss: 1.9405  Val-Acc: 0.28 Time: 25503.76 Local Steps: 874800\n",
      "34.63509\n",
      "Train: Step:  4373 Val-Loss: 2.1137  Val-Acc: 0.26 Time: 25554.27 Local Steps: 876400\n",
      "33.312607\n",
      "Train: Step:  4382 Val-Loss: 1.9845  Val-Acc: 0.23 Time: 25607.13 Local Steps: 878200\n",
      "33.269993\n",
      "Train: Step:  4392 Val-Loss: 1.9720  Val-Acc: 0.28 Time: 25661.58 Local Steps: 880200\n",
      "34.013058\n",
      "Train: Step:  4401 Val-Loss: 1.9340  Val-Acc: 0.23 Time: 25714.73 Local Steps: 882000\n",
      "34.19301\n",
      "Train: Step:  4410 Val-Loss: 2.1051  Val-Acc: 0.23 Time: 25769.43 Local Steps: 883800\n",
      "33.699646\n",
      "Train: Step:  4419 Val-Loss: 1.9080  Val-Acc: 0.29 Time: 25823.18 Local Steps: 885600\n",
      "33.380047\n",
      "Train: Step:  4428 Val-Loss: 1.8323  Val-Acc: 0.32 Time: 25876.78 Local Steps: 887400\n",
      "34.614\n",
      "Train: Step:  4437 Val-Loss: 2.1368  Val-Acc: 0.24 Time: 25931.13 Local Steps: 889200\n",
      "32.56747\n",
      "Train: Step:  4446 Val-Loss: 1.8336  Val-Acc: 0.31 Time: 25981.99 Local Steps: 891000\n",
      "32.619995\n",
      "Train: Step:  4455 Val-Loss: 1.8597  Val-Acc: 0.32 Time: 26034.86 Local Steps: 892800\n",
      "32.803585\n",
      "Train: Step:  4464 Val-Loss: 1.8387  Val-Acc: 0.32 Time: 26086.12 Local Steps: 894600\n",
      "33.77075\n",
      "Train: Step:  4473 Val-Loss: 1.8908  Val-Acc: 0.25 Time: 26143.74 Local Steps: 896400\n",
      "33.433487\n",
      "Train: Step:  4482 Val-Loss: 1.9265  Val-Acc: 0.26 Time: 26198.39 Local Steps: 898200\n",
      "33.067642\n",
      "Train: Step:  4492 Val-Loss: 1.8621  Val-Acc: 0.30 Time: 26253.46 Local Steps: 900200\n",
      "32.618984\n",
      "Train: Step:  4501 Val-Loss: 1.8399  Val-Acc: 0.31 Time: 26306.27 Local Steps: 902000\n",
      "32.480755\n",
      "Train: Step:  4511 Val-Loss: 1.8528  Val-Acc: 0.30 Time: 26361.32 Local Steps: 904000\n",
      "33.30265\n",
      "Train: Step:  4519 Val-Loss: 1.9440  Val-Acc: 0.30 Time: 26413.97 Local Steps: 905600\n",
      "33.784283\n",
      "Train: Step:  4529 Val-Loss: 2.2215  Val-Acc: 0.27 Time: 26466.28 Local Steps: 907600\n",
      "34.46068\n",
      "Train: Step:  4538 Val-Loss: 2.0098  Val-Acc: 0.28 Time: 26520.42 Local Steps: 909400\n",
      "33.164455\n",
      "Train: Step:  4547 Val-Loss: 1.9166  Val-Acc: 0.28 Time: 26573.46 Local Steps: 911200\n",
      "32.781467\n",
      "Train: Step:  4556 Val-Loss: 1.8863  Val-Acc: 0.29 Time: 26624.47 Local Steps: 913000\n",
      "33.407593\n",
      "Train: Step:  4565 Val-Loss: 1.8902  Val-Acc: 0.30 Time: 26679.66 Local Steps: 914800\n",
      "33.385323\n",
      "Train: Step:  4575 Val-Loss: 1.8925  Val-Acc: 0.26 Time: 26734.50 Local Steps: 916800\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "33.52645\n",
      "Train: Step:  4584 Val-Loss: 1.9277  Val-Acc: 0.29 Time: 26788.03 Local Steps: 918600\n",
      "33.56839\n",
      "Train: Step:  4592 Val-Loss: 2.0109  Val-Acc: 0.28 Time: 26839.63 Local Steps: 920200\n",
      "33.259895\n",
      "Train: Step:  4601 Val-Loss: 1.9116  Val-Acc: 0.27 Time: 26891.95 Local Steps: 922000\n",
      "32.78888\n",
      "Train: Step:  4611 Val-Loss: 1.9158  Val-Acc: 0.23 Time: 26947.72 Local Steps: 924000\n",
      "32.303207\n",
      "Train: Step:  4620 Val-Loss: 1.9243  Val-Acc: 0.29 Time: 26998.68 Local Steps: 925800\n",
      "32.990265\n",
      "Train: Step:  4629 Val-Loss: 1.9121  Val-Acc: 0.30 Time: 27049.28 Local Steps: 927600\n",
      "32.92137\n",
      "Train: Step:  4638 Val-Loss: 1.9396  Val-Acc: 0.24 Time: 27104.66 Local Steps: 929400\n",
      "33.154617\n",
      "Train: Step:  4647 Val-Loss: 1.9107  Val-Acc: 0.30 Time: 27156.45 Local Steps: 931200\n",
      "32.70468\n",
      "Train: Step:  4657 Val-Loss: 1.7946  Val-Acc: 0.34 Time: 27217.13 Local Steps: 933200\n",
      "34.77782\n",
      "Train: Step:  4667 Val-Loss: 2.1703  Val-Acc: 0.19 Time: 27271.54 Local Steps: 935200\n",
      "33.164276\n",
      "Train: Step:  4677 Val-Loss: 1.8903  Val-Acc: 0.29 Time: 27326.04 Local Steps: 937200\n",
      "32.98711\n",
      "Train: Step:  4686 Val-Loss: 1.9416  Val-Acc: 0.28 Time: 27379.27 Local Steps: 939000\n",
      "32.465046\n",
      "Train: Step:  4695 Val-Loss: 1.8282  Val-Acc: 0.29 Time: 27431.56 Local Steps: 940800\n",
      "33.242275\n",
      "Train: Step:  4704 Val-Loss: 1.8522  Val-Acc: 0.27 Time: 27483.80 Local Steps: 942600\n",
      "32.95921\n",
      "Train: Step:  4713 Val-Loss: 1.8043  Val-Acc: 0.34 Time: 27535.17 Local Steps: 944400\n",
      "33.161297\n",
      "Train: Step:  4722 Val-Loss: 1.8799  Val-Acc: 0.30 Time: 27585.87 Local Steps: 946200\n",
      "34.148895\n",
      "Train: Step:  4731 Val-Loss: 2.0618  Val-Acc: 0.24 Time: 27636.24 Local Steps: 948000\n",
      "32.741592\n",
      "Train: Step:  4739 Val-Loss: 1.8292  Val-Acc: 0.33 Time: 27686.35 Local Steps: 949600\n",
      "32.8535\n",
      "Train: Step:  4748 Val-Loss: 1.9620  Val-Acc: 0.19 Time: 27740.50 Local Steps: 951400\n",
      "32.67515\n",
      "Train: Step:  4757 Val-Loss: 1.9119  Val-Acc: 0.23 Time: 27791.50 Local Steps: 953200\n",
      "32.76435\n",
      "Train: Step:  4766 Val-Loss: 2.0150  Val-Acc: 0.25 Time: 27847.58 Local Steps: 955000\n",
      "32.473907\n",
      "Train: Step:  4786 Val-Loss: 1.8839  Val-Acc: 0.30 Time: 27958.93 Local Steps: 959000\n",
      "32.89216\n",
      "Train: Step:  4795 Val-Loss: 1.8583  Val-Acc: 0.33 Time: 28012.59 Local Steps: 960800\n",
      "33.353752\n",
      "Train: Step:  4804 Val-Loss: 1.9231  Val-Acc: 0.28 Time: 28068.07 Local Steps: 962600\n",
      "32.61824\n",
      "Train: Step:  4813 Val-Loss: 1.8311  Val-Acc: 0.30 Time: 28123.15 Local Steps: 964400\n",
      "32.55091\n",
      "Train: Step:  4822 Val-Loss: 1.9172  Val-Acc: 0.27 Time: 28173.88 Local Steps: 966200\n",
      "32.426147\n",
      "Train: Step:  4831 Val-Loss: 1.8607  Val-Acc: 0.31 Time: 28225.83 Local Steps: 968000\n",
      "32.454212\n",
      "Train: Step:  4840 Val-Loss: 1.8626  Val-Acc: 0.34 Time: 28279.71 Local Steps: 969800\n",
      "31.979546\n",
      "Train: Step:  4849 Val-Loss: 1.7986  Val-Acc: 0.35 Time: 28335.21 Local Steps: 971600\n",
      "32.621326\n",
      "Train: Step:  4867 Val-Loss: 1.9645  Val-Acc: 0.27 Time: 28439.67 Local Steps: 975200\n",
      "33.406834\n",
      "Train: Step:  4886 Val-Loss: 1.9345  Val-Acc: 0.30 Time: 28544.87 Local Steps: 979000\n",
      "32.48296\n",
      "Train: Step:  4895 Val-Loss: 1.8328  Val-Acc: 0.32 Time: 28595.87 Local Steps: 980800\n",
      "32.33628\n",
      "Train: Step:  4904 Val-Loss: 1.8346  Val-Acc: 0.29 Time: 28650.76 Local Steps: 982600\n",
      "32.57216\n",
      "Train: Step:  4913 Val-Loss: 1.9010  Val-Acc: 0.28 Time: 28703.62 Local Steps: 984400\n",
      "32.392853\n",
      "Train: Step:  4922 Val-Loss: 1.8852  Val-Acc: 0.27 Time: 28754.89 Local Steps: 986200\n",
      "32.31698\n",
      "Train: Step:  4931 Val-Loss: 1.8838  Val-Acc: 0.27 Time: 28808.50 Local Steps: 988000\n",
      "31.662256\n",
      "Train: Step:  4939 Val-Loss: 1.7785  Val-Acc: 0.32 Time: 28858.88 Local Steps: 989600\n",
      "32.91073\n",
      "Train: Step:  4948 Val-Loss: 2.0372  Val-Acc: 0.23 Time: 28910.76 Local Steps: 991400\n",
      "32.610542\n",
      "Train: Step:  4958 Val-Loss: 1.9262  Val-Acc: 0.29 Time: 28962.14 Local Steps: 993400\n",
      "31.993896\n",
      "Train: Step:  4967 Val-Loss: 1.8906  Val-Acc: 0.25 Time: 29016.53 Local Steps: 995200\n",
      "32.30822\n",
      "Train: Step:  4976 Val-Loss: 1.8849  Val-Acc: 0.27 Time: 29071.61 Local Steps: 997000\n",
      "32.34071\n",
      "Train: Step:  4985 Val-Loss: 1.8669  Val-Acc: 0.31 Time: 29126.03 Local Steps: 998800\n",
      "32.086353\n",
      "Train: Step:  4994 Val-Loss: 1.8197  Val-Acc: 0.33 Time: 29176.82 Local Steps: 1000600\n",
      "33.13949\n",
      "Train: Step:  5003 Val-Loss: 1.9047  Val-Acc: 0.27 Time: 29227.19 Local Steps: 1002400\n",
      "32.54977\n",
      "Train: Step:  5012 Val-Loss: 1.8833  Val-Acc: 0.26 Time: 29281.62 Local Steps: 1004200\n",
      "32.395382\n",
      "Train: Step:  5021 Val-Loss: 1.8668  Val-Acc: 0.31 Time: 29332.68 Local Steps: 1006000\n",
      "32.32452\n",
      "Train: Step:  5029 Val-Loss: 1.8933  Val-Acc: 0.28 Time: 29383.67 Local Steps: 1007600\n",
      "32.492672\n",
      "Train: Step:  5038 Val-Loss: 1.8153  Val-Acc: 0.27 Time: 29437.00 Local Steps: 1009400\n",
      "32.875908\n",
      "Train: Step:  5047 Val-Loss: 1.9464  Val-Acc: 0.21 Time: 29490.28 Local Steps: 1011200\n",
      "32.884056\n",
      "Train: Step:  5056 Val-Loss: 1.9787  Val-Acc: 0.22 Time: 29541.29 Local Steps: 1013000\n",
      "31.603102\n",
      "Train: Step:  5065 Val-Loss: 1.8157  Val-Acc: 0.31 Time: 29595.73 Local Steps: 1014800\n",
      "32.227825\n",
      "Train: Step:  5074 Val-Loss: 1.7865  Val-Acc: 0.35 Time: 29646.18 Local Steps: 1016600\n",
      "32.63562\n",
      "Train: Step:  5083 Val-Loss: 1.8266  Val-Acc: 0.28 Time: 29699.99 Local Steps: 1018400\n",
      "32.611725\n",
      "Train: Step:  5092 Val-Loss: 1.8980  Val-Acc: 0.29 Time: 29754.19 Local Steps: 1020200\n",
      "32.332443\n",
      "Train: Step:  5101 Val-Loss: 1.8313  Val-Acc: 0.28 Time: 29805.20 Local Steps: 1022000\n",
      "32.64669\n",
      "Train: Step:  5110 Val-Loss: 1.8929  Val-Acc: 0.29 Time: 29857.32 Local Steps: 1023800\n",
      "32.55418\n",
      "Train: Step:  5119 Val-Loss: 1.9366  Val-Acc: 0.28 Time: 29909.53 Local Steps: 1025600\n",
      "31.618114\n",
      "Train: Step:  5128 Val-Loss: 1.8114  Val-Acc: 0.29 Time: 29964.13 Local Steps: 1027400\n",
      "31.730469\n",
      "Train: Step:  5137 Val-Loss: 1.8748  Val-Acc: 0.29 Time: 30015.94 Local Steps: 1029200\n",
      "32.65223\n",
      "Train: Step:  5146 Val-Loss: 1.9559  Val-Acc: 0.28 Time: 30070.20 Local Steps: 1031000\n",
      "33.096825\n",
      "Train: Step:  5155 Val-Loss: 2.0646  Val-Acc: 0.26 Time: 30120.79 Local Steps: 1032800\n",
      "32.250008\n",
      "Train: Step:  5164 Val-Loss: 1.8536  Val-Acc: 0.25 Time: 30174.93 Local Steps: 1034600\n",
      "32.708565\n",
      "Train: Step:  5173 Val-Loss: 1.9917  Val-Acc: 0.26 Time: 30227.38 Local Steps: 1036400\n",
      "33.1082\n",
      "Train: Step:  5182 Val-Loss: 1.8840  Val-Acc: 0.25 Time: 30279.06 Local Steps: 1038200\n",
      "32.356796\n",
      "Train: Step:  5191 Val-Loss: 1.8990  Val-Acc: 0.31 Time: 30331.16 Local Steps: 1040000\n",
      "32.68191\n",
      "Train: Step:  5201 Val-Loss: 1.8200  Val-Acc: 0.32 Time: 30388.90 Local Steps: 1042000\n",
      "32.703247\n",
      "Train: Step:  5211 Val-Loss: 1.9817  Val-Acc: 0.25 Time: 30446.36 Local Steps: 1044000\n",
      "32.917145\n",
      "Train: Step:  5221 Val-Loss: 1.8591  Val-Acc: 0.31 Time: 30501.42 Local Steps: 1046000\n",
      "32.343628\n",
      "Train: Step:  5230 Val-Loss: 1.8522  Val-Acc: 0.33 Time: 30554.11 Local Steps: 1047800\n",
      "33.205593\n",
      "Train: Step:  5239 Val-Loss: 1.8495  Val-Acc: 0.29 Time: 30604.87 Local Steps: 1049600\n",
      "32.556206\n",
      "Train: Step:  5248 Val-Loss: 2.0072  Val-Acc: 0.24 Time: 30655.11 Local Steps: 1051400\n",
      "32.021652\n",
      "Train: Step:  5257 Val-Loss: 1.8252  Val-Acc: 0.33 Time: 30705.92 Local Steps: 1053200\n",
      "32.880272\n",
      "Train: Step:  5266 Val-Loss: 2.0191  Val-Acc: 0.22 Time: 30762.44 Local Steps: 1055000\n",
      "33.30241\n",
      "Train: Step:  5275 Val-Loss: 1.8808  Val-Acc: 0.29 Time: 30815.12 Local Steps: 1056800\n",
      "32.39593\n",
      "Train: Step:  5285 Val-Loss: 1.8719  Val-Acc: 0.29 Time: 30867.47 Local Steps: 1058800\n",
      "32.227978\n",
      "Train: Step:  5294 Val-Loss: 1.8494  Val-Acc: 0.27 Time: 30919.13 Local Steps: 1060600\n",
      "32.49711\n",
      "Train: Step:  5303 Val-Loss: 1.9068  Val-Acc: 0.27 Time: 30971.80 Local Steps: 1062400\n",
      "31.619123\n",
      "Train: Step:  5312 Val-Loss: 1.8475  Val-Acc: 0.32 Time: 31024.80 Local Steps: 1064200\n",
      "33.443687\n",
      "Train: Step:  5322 Val-Loss: 1.9808  Val-Acc: 0.24 Time: 31080.38 Local Steps: 1066200\n",
      "31.86187\n",
      "Train: Step:  5330 Val-Loss: 1.8481  Val-Acc: 0.29 Time: 31130.57 Local Steps: 1067800\n",
      "31.705238\n",
      "Train: Step:  5340 Val-Loss: 1.8915  Val-Acc: 0.29 Time: 31185.73 Local Steps: 1069800\n",
      "32.829704\n",
      "Train: Step:  5349 Val-Loss: 1.8676  Val-Acc: 0.31 Time: 31237.05 Local Steps: 1071600\n",
      "31.646698\n",
      "Train: Step:  5358 Val-Loss: 1.8451  Val-Acc: 0.31 Time: 31292.45 Local Steps: 1073400\n",
      "32.166016\n",
      "Train: Step:  5368 Val-Loss: 1.8672  Val-Acc: 0.31 Time: 31346.21 Local Steps: 1075400\n",
      "31.36332\n",
      "Train: Step:  5376 Val-Loss: 1.8124  Val-Acc: 0.36 Time: 31397.93 Local Steps: 1077000\n",
      "33.117867\n",
      "Train: Step:  5386 Val-Loss: 2.1147  Val-Acc: 0.28 Time: 31454.21 Local Steps: 1079000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "32.38417\n",
      "Train: Step:  5395 Val-Loss: 1.9029  Val-Acc: 0.29 Time: 31508.39 Local Steps: 1080800\n",
      "31.686737\n",
      "Train: Step:  5404 Val-Loss: 1.8463  Val-Acc: 0.30 Time: 31561.27 Local Steps: 1082600\n",
      "32.29111\n",
      "Train: Step:  5414 Val-Loss: 1.9176  Val-Acc: 0.26 Time: 31615.70 Local Steps: 1084600\n",
      "31.90366\n",
      "Train: Step:  5423 Val-Loss: 1.9057  Val-Acc: 0.27 Time: 31668.83 Local Steps: 1086400\n",
      "31.942978\n",
      "Train: Step:  5432 Val-Loss: 1.8206  Val-Acc: 0.35 Time: 31720.84 Local Steps: 1088200\n",
      "31.875011\n",
      "Train: Step:  5441 Val-Loss: 1.8989  Val-Acc: 0.28 Time: 31776.17 Local Steps: 1090000\n",
      "32.517532\n",
      "Train: Step:  5450 Val-Loss: 1.8654  Val-Acc: 0.31 Time: 31826.76 Local Steps: 1091800\n",
      "31.504631\n",
      "Train: Step:  5459 Val-Loss: 1.8879  Val-Acc: 0.29 Time: 31881.78 Local Steps: 1093600\n",
      "32.690742\n",
      "Train: Step:  5468 Val-Loss: 1.9705  Val-Acc: 0.26 Time: 31933.32 Local Steps: 1095400\n",
      "31.812841\n",
      "Train: Step:  5477 Val-Loss: 1.8762  Val-Acc: 0.29 Time: 31984.89 Local Steps: 1097200\n",
      "31.878258\n",
      "Train: Step:  5486 Val-Loss: 1.7798  Val-Acc: 0.32 Time: 32038.27 Local Steps: 1099000\n",
      "31.646929\n",
      "Train: Step:  5496 Val-Loss: 1.8806  Val-Acc: 0.29 Time: 32091.61 Local Steps: 1101000\n",
      "32.4581\n",
      "Train: Step:  5505 Val-Loss: 2.0636  Val-Acc: 0.17 Time: 32144.98 Local Steps: 1102800\n",
      "31.471806\n",
      "Train: Step:  5514 Val-Loss: 1.8005  Val-Acc: 0.35 Time: 32195.63 Local Steps: 1104600\n",
      "31.790161\n",
      "Train: Step:  5523 Val-Loss: 1.8137  Val-Acc: 0.30 Time: 32247.24 Local Steps: 1106400\n",
      "31.972013\n",
      "Train: Step:  5533 Val-Loss: 1.9226  Val-Acc: 0.28 Time: 32304.19 Local Steps: 1108400\n",
      "32.98392\n",
      "Train: Step:  5542 Val-Loss: 1.9783  Val-Acc: 0.23 Time: 32358.39 Local Steps: 1110200\n",
      "32.356636\n",
      "Train: Step:  5552 Val-Loss: 1.9224  Val-Acc: 0.27 Time: 32414.64 Local Steps: 1112200\n",
      "31.97187\n",
      "Train: Step:  5561 Val-Loss: 1.9576  Val-Acc: 0.27 Time: 32465.91 Local Steps: 1114000\n",
      "32.101715\n",
      "Train: Step:  5570 Val-Loss: 1.9338  Val-Acc: 0.25 Time: 32516.16 Local Steps: 1115800\n",
      "31.541975\n",
      "Train: Step:  5579 Val-Loss: 1.8376  Val-Acc: 0.33 Time: 32569.51 Local Steps: 1117600\n",
      "31.715467\n",
      "Train: Step:  5588 Val-Loss: 1.7888  Val-Acc: 0.37 Time: 32623.90 Local Steps: 1119400\n",
      "31.352283\n",
      "Train: Step:  5597 Val-Loss: 1.8711  Val-Acc: 0.27 Time: 32674.01 Local Steps: 1121200\n",
      "31.878641\n",
      "Train: Step:  5606 Val-Loss: 1.8348  Val-Acc: 0.29 Time: 32726.10 Local Steps: 1123000\n",
      "31.302834\n",
      "Train: Step:  5615 Val-Loss: 1.8213  Val-Acc: 0.31 Time: 32776.93 Local Steps: 1124800\n",
      "31.480938\n",
      "Train: Step:  5624 Val-Loss: 1.8621  Val-Acc: 0.29 Time: 32831.40 Local Steps: 1126600\n",
      "33.17684\n",
      "Train: Step:  5633 Val-Loss: 1.9691  Val-Acc: 0.32 Time: 32883.70 Local Steps: 1128400\n",
      "32.2228\n",
      "Train: Step:  5642 Val-Loss: 1.9014  Val-Acc: 0.32 Time: 32939.62 Local Steps: 1130200\n",
      "32.434517\n",
      "Train: Step:  5652 Val-Loss: 1.8922  Val-Acc: 0.29 Time: 32993.40 Local Steps: 1132200\n",
      "32.08731\n",
      "Train: Step:  5661 Val-Loss: 1.7916  Val-Acc: 0.34 Time: 33047.26 Local Steps: 1134000\n",
      "31.870388\n",
      "Train: Step:  5670 Val-Loss: 1.9460  Val-Acc: 0.26 Time: 33098.91 Local Steps: 1135800\n",
      "32.525093\n",
      "Train: Step:  5679 Val-Loss: 1.9961  Val-Acc: 0.28 Time: 33149.01 Local Steps: 1137600\n",
      "31.75103\n",
      "Train: Step:  5688 Val-Loss: 1.8761  Val-Acc: 0.33 Time: 33205.45 Local Steps: 1139400\n",
      "31.895805\n",
      "Train: Step:  5698 Val-Loss: 2.0010  Val-Acc: 0.25 Time: 33262.11 Local Steps: 1141400\n",
      "31.888695\n",
      "Train: Step:  5707 Val-Loss: 1.9904  Val-Acc: 0.26 Time: 33315.23 Local Steps: 1143200\n",
      "32.580696\n",
      "Train: Step:  5717 Val-Loss: 1.9428  Val-Acc: 0.26 Time: 33371.17 Local Steps: 1145200\n",
      "32.04741\n",
      "Train: Step:  5726 Val-Loss: 1.8662  Val-Acc: 0.30 Time: 33424.55 Local Steps: 1147000\n",
      "32.169235\n",
      "Train: Step:  5735 Val-Loss: 1.9417  Val-Acc: 0.28 Time: 33479.80 Local Steps: 1148800\n",
      "31.281013\n",
      "Train: Step:  5744 Val-Loss: 1.7933  Val-Acc: 0.32 Time: 33531.75 Local Steps: 1150600\n",
      "31.19251\n",
      "Train: Step:  5753 Val-Loss: 1.8370  Val-Acc: 0.30 Time: 33581.80 Local Steps: 1152400\n",
      "32.039467\n",
      "Train: Step:  5761 Val-Loss: 1.9283  Val-Acc: 0.27 Time: 33634.73 Local Steps: 1154000\n",
      "32.0833\n",
      "Train: Step:  5770 Val-Loss: 1.9497  Val-Acc: 0.22 Time: 33684.73 Local Steps: 1155800\n",
      "32.261497\n",
      "Train: Step:  5779 Val-Loss: 1.8770  Val-Acc: 0.29 Time: 33737.11 Local Steps: 1157600\n",
      "31.515482\n",
      "Train: Step:  5788 Val-Loss: 1.8884  Val-Acc: 0.29 Time: 33789.04 Local Steps: 1159400\n",
      "31.76928\n",
      "Train: Step:  5797 Val-Loss: 1.9049  Val-Acc: 0.27 Time: 33840.48 Local Steps: 1161200\n",
      "31.744976\n",
      "Train: Step:  5806 Val-Loss: 1.8547  Val-Acc: 0.29 Time: 33894.29 Local Steps: 1163000\n",
      "31.474245\n",
      "Train: Step:  5815 Val-Loss: 1.8368  Val-Acc: 0.33 Time: 33947.59 Local Steps: 1164800\n",
      "30.790508\n",
      "Train: Step:  5824 Val-Loss: 1.8620  Val-Acc: 0.30 Time: 33998.89 Local Steps: 1166600\n",
      "31.844296\n",
      "Train: Step:  5833 Val-Loss: 1.9747  Val-Acc: 0.24 Time: 34050.93 Local Steps: 1168400\n",
      "31.151293\n",
      "Train: Step:  5842 Val-Loss: 1.7756  Val-Acc: 0.34 Time: 34101.24 Local Steps: 1170200\n",
      "31.02147\n",
      "Train: Step:  5852 Val-Loss: 1.8576  Val-Acc: 0.31 Time: 34160.84 Local Steps: 1172200\n",
      "32.581894\n",
      "Train: Step:  5861 Val-Loss: 2.0679  Val-Acc: 0.25 Time: 34214.61 Local Steps: 1174000\n",
      "31.086607\n",
      "Train: Step:  5870 Val-Loss: 1.8594  Val-Acc: 0.32 Time: 34266.13 Local Steps: 1175800\n",
      "31.031687\n",
      "Train: Step:  5879 Val-Loss: 1.8651  Val-Acc: 0.27 Time: 34319.96 Local Steps: 1177600\n",
      "31.47913\n",
      "Train: Step:  5888 Val-Loss: 1.8881  Val-Acc: 0.32 Time: 34371.70 Local Steps: 1179400\n",
      "30.8667\n",
      "Train: Step:  5897 Val-Loss: 1.8941  Val-Acc: 0.28 Time: 34424.37 Local Steps: 1181200\n",
      "31.406033\n",
      "Train: Step:  5906 Val-Loss: 1.9336  Val-Acc: 0.29 Time: 34476.98 Local Steps: 1183000\n",
      "31.682178\n",
      "Train: Step:  5914 Val-Loss: 1.8581  Val-Acc: 0.30 Time: 34527.97 Local Steps: 1184600\n",
      "31.916431\n",
      "Train: Step:  5923 Val-Loss: 2.0025  Val-Acc: 0.24 Time: 34579.19 Local Steps: 1186400\n",
      "31.383507\n",
      "Train: Step:  5932 Val-Loss: 1.8894  Val-Acc: 0.29 Time: 34629.78 Local Steps: 1188200\n",
      "30.959541\n",
      "Train: Step:  5940 Val-Loss: 1.8991  Val-Acc: 0.26 Time: 34681.34 Local Steps: 1189800\n",
      "31.406063\n",
      "Train: Step:  5950 Val-Loss: 1.8259  Val-Acc: 0.34 Time: 34735.84 Local Steps: 1191800\n",
      "31.480824\n",
      "Train: Step:  5959 Val-Loss: 2.0216  Val-Acc: 0.22 Time: 34790.41 Local Steps: 1193600\n",
      "30.980158\n",
      "Train: Step:  5968 Val-Loss: 1.8168  Val-Acc: 0.28 Time: 34842.98 Local Steps: 1195400\n",
      "32.813637\n",
      "Train: Step:  5977 Val-Loss: 2.0595  Val-Acc: 0.26 Time: 34894.52 Local Steps: 1197200\n",
      "31.105278\n",
      "Train: Step:  5985 Val-Loss: 1.8609  Val-Acc: 0.30 Time: 34944.75 Local Steps: 1198800\n",
      "31.298662\n",
      "Train: Step:  5995 Val-Loss: 1.8202  Val-Acc: 0.32 Time: 35002.59 Local Steps: 1200800\n",
      "31.883415\n",
      "Train: Step:  6004 Val-Loss: 1.9902  Val-Acc: 0.26 Time: 35054.45 Local Steps: 1202600\n",
      "31.432161\n",
      "Train: Step:  6014 Val-Loss: 1.9054  Val-Acc: 0.26 Time: 35110.11 Local Steps: 1204600\n",
      "30.716839\n",
      "Train: Step:  6022 Val-Loss: 1.8347  Val-Acc: 0.35 Time: 35160.39 Local Steps: 1206200\n",
      "30.85774\n",
      "Train: Step:  6031 Val-Loss: 1.8145  Val-Acc: 0.34 Time: 35214.86 Local Steps: 1208000\n",
      "32.764557\n",
      "Train: Step:  6041 Val-Loss: 1.8818  Val-Acc: 0.31 Time: 35268.18 Local Steps: 1210000\n",
      "32.22602\n",
      "Train: Step:  6050 Val-Loss: 2.1129  Val-Acc: 0.14 Time: 35325.34 Local Steps: 1211800\n",
      "31.646933\n",
      "Train: Step:  6059 Val-Loss: 1.9080  Val-Acc: 0.25 Time: 35376.19 Local Steps: 1213600\n",
      "31.450497\n",
      "Train: Step:  6068 Val-Loss: 1.9780  Val-Acc: 0.26 Time: 35428.03 Local Steps: 1215400\n",
      "30.94218\n",
      "Train: Step:  6077 Val-Loss: 1.8371  Val-Acc: 0.32 Time: 35478.70 Local Steps: 1217200\n",
      "31.064316\n",
      "Train: Step:  6086 Val-Loss: 1.9042  Val-Acc: 0.27 Time: 35533.18 Local Steps: 1219000\n",
      "31.027758\n",
      "Train: Step:  6095 Val-Loss: 1.8218  Val-Acc: 0.33 Time: 35583.40 Local Steps: 1220800\n",
      "31.709059\n",
      "Train: Step:  6105 Val-Loss: 1.8943  Val-Acc: 0.28 Time: 35639.57 Local Steps: 1222800\n",
      "31.079632\n",
      "Train: Step:  6114 Val-Loss: 1.8844  Val-Acc: 0.31 Time: 35691.78 Local Steps: 1224600\n",
      "32.270893\n",
      "Train: Step:  6123 Val-Loss: 2.0802  Val-Acc: 0.24 Time: 35743.84 Local Steps: 1226400\n",
      "32.144783\n",
      "Train: Step:  6133 Val-Loss: 2.0418  Val-Acc: 0.24 Time: 35797.48 Local Steps: 1228400\n",
      "31.72023\n",
      "Train: Step:  6141 Val-Loss: 1.8514  Val-Acc: 0.31 Time: 35848.44 Local Steps: 1230000\n",
      "31.31475\n",
      "Train: Step:  6150 Val-Loss: 1.8729  Val-Acc: 0.34 Time: 35899.02 Local Steps: 1231800\n",
      "32.35795\n",
      "Train: Step:  6159 Val-Loss: 1.9592  Val-Acc: 0.26 Time: 35951.04 Local Steps: 1233600\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "31.697626\n",
      "Train: Step:  6169 Val-Loss: 1.8819  Val-Acc: 0.29 Time: 36007.08 Local Steps: 1235600\n",
      "30.810356\n",
      "Train: Step:  6177 Val-Loss: 1.8347  Val-Acc: 0.30 Time: 36058.25 Local Steps: 1237200\n",
      "31.089684\n",
      "Train: Step:  6185 Val-Loss: 1.9251  Val-Acc: 0.28 Time: 36108.41 Local Steps: 1238800\n",
      "31.116596\n",
      "Train: Step:  6194 Val-Loss: 1.8600  Val-Acc: 0.30 Time: 36158.84 Local Steps: 1240600\n",
      "30.919119\n",
      "Train: Step:  6204 Val-Loss: 1.8214  Val-Acc: 0.32 Time: 36214.70 Local Steps: 1242600\n",
      "32.912876\n",
      "Train: Step:  6213 Val-Loss: 2.0674  Val-Acc: 0.29 Time: 36265.49 Local Steps: 1244400\n",
      "32.81302\n",
      "Train: Step:  6222 Val-Loss: 1.9400  Val-Acc: 0.27 Time: 36317.35 Local Steps: 1246200\n",
      "30.767784\n",
      "Train: Step:  6231 Val-Loss: 1.9067  Val-Acc: 0.26 Time: 36370.21 Local Steps: 1248000\n",
      "31.272375\n",
      "Train: Step:  6240 Val-Loss: 1.9066  Val-Acc: 0.29 Time: 36424.71 Local Steps: 1249800\n",
      "30.898996\n",
      "Train: Step:  6249 Val-Loss: 1.8852  Val-Acc: 0.29 Time: 36475.59 Local Steps: 1251600\n",
      "31.72575\n",
      "Train: Step:  6258 Val-Loss: 1.9623  Val-Acc: 0.30 Time: 36526.60 Local Steps: 1253400\n",
      "30.785366\n",
      "Train: Step:  6267 Val-Loss: 1.8164  Val-Acc: 0.34 Time: 36578.22 Local Steps: 1255200\n",
      "30.522964\n",
      "Train: Step:  6276 Val-Loss: 1.9353  Val-Acc: 0.28 Time: 36628.32 Local Steps: 1257000\n",
      "32.18839\n",
      "Train: Step:  6285 Val-Loss: 1.9261  Val-Acc: 0.23 Time: 36683.90 Local Steps: 1258800\n",
      "30.829126\n",
      "Train: Step:  6294 Val-Loss: 1.8602  Val-Acc: 0.30 Time: 36734.12 Local Steps: 1260600\n",
      "31.445683\n",
      "Train: Step:  6303 Val-Loss: 1.7930  Val-Acc: 0.34 Time: 36787.60 Local Steps: 1262400\n",
      "31.655455\n",
      "Train: Step:  6312 Val-Loss: 1.9533  Val-Acc: 0.24 Time: 36838.38 Local Steps: 1264200\n",
      "33.178207\n",
      "Train: Step:  6321 Val-Loss: 2.0803  Val-Acc: 0.21 Time: 36892.07 Local Steps: 1266000\n",
      "30.930946\n",
      "Train: Step:  6330 Val-Loss: 1.8457  Val-Acc: 0.29 Time: 36943.37 Local Steps: 1267800\n",
      "30.62968\n",
      "Train: Step:  6339 Val-Loss: 1.8620  Val-Acc: 0.29 Time: 37000.27 Local Steps: 1269600\n",
      "31.512466\n",
      "Train: Step:  6348 Val-Loss: 1.9981  Val-Acc: 0.25 Time: 37050.35 Local Steps: 1271400\n",
      "31.407997\n",
      "Train: Step:  6357 Val-Loss: 1.8880  Val-Acc: 0.31 Time: 37103.37 Local Steps: 1273200\n",
      "31.170834\n",
      "Train: Step:  6367 Val-Loss: 1.8330  Val-Acc: 0.31 Time: 37158.41 Local Steps: 1275200\n",
      "31.080349\n",
      "Train: Step:  6376 Val-Loss: 1.8190  Val-Acc: 0.33 Time: 37209.63 Local Steps: 1277000\n",
      "31.598612\n",
      "Train: Step:  6385 Val-Loss: 1.8104  Val-Acc: 0.31 Time: 37264.00 Local Steps: 1278800\n",
      "31.098574\n",
      "Train: Step:  6394 Val-Loss: 1.8500  Val-Acc: 0.34 Time: 37316.88 Local Steps: 1280600\n",
      "31.389519\n",
      "Train: Step:  6403 Val-Loss: 1.9880  Val-Acc: 0.25 Time: 37371.34 Local Steps: 1282400\n",
      "31.651228\n",
      "Train: Step:  6412 Val-Loss: 2.0789  Val-Acc: 0.26 Time: 37425.81 Local Steps: 1284200\n",
      "30.734383\n",
      "Train: Step:  6421 Val-Loss: 1.8171  Val-Acc: 0.35 Time: 37480.20 Local Steps: 1286000\n",
      "31.388355\n",
      "Train: Step:  6431 Val-Loss: 1.9113  Val-Acc: 0.26 Time: 37531.94 Local Steps: 1288000\n",
      "31.579865\n",
      "Train: Step:  6440 Val-Loss: 1.8524  Val-Acc: 0.31 Time: 37585.27 Local Steps: 1289800\n",
      "31.628277\n",
      "Train: Step:  6449 Val-Loss: 2.0376  Val-Acc: 0.22 Time: 37637.27 Local Steps: 1291600\n",
      "30.972427\n",
      "Train: Step:  6458 Val-Loss: 1.8185  Val-Acc: 0.31 Time: 37689.00 Local Steps: 1293400\n",
      "30.57346\n",
      "Train: Step:  6467 Val-Loss: 1.7912  Val-Acc: 0.36 Time: 37742.37 Local Steps: 1295200\n",
      "30.961275\n",
      "Train: Step:  6476 Val-Loss: 1.8558  Val-Acc: 0.30 Time: 37796.59 Local Steps: 1297000\n",
      "32.683426\n",
      "Train: Step:  6485 Val-Loss: 1.9695  Val-Acc: 0.30 Time: 37851.76 Local Steps: 1298800\n",
      "31.382683\n",
      "Train: Step:  6494 Val-Loss: 1.8551  Val-Acc: 0.33 Time: 37902.23 Local Steps: 1300600\n",
      "30.859905\n",
      "Train: Step:  6503 Val-Loss: 1.9368  Val-Acc: 0.25 Time: 37953.65 Local Steps: 1302400\n",
      "32.090137\n",
      "Train: Step:  6511 Val-Loss: 1.9390  Val-Acc: 0.27 Time: 38007.32 Local Steps: 1304000\n",
      "31.39332\n",
      "Train: Step:  6521 Val-Loss: 1.9821  Val-Acc: 0.22 Time: 38060.04 Local Steps: 1306000\n",
      "31.408716\n",
      "Train: Step:  6530 Val-Loss: 1.9107  Val-Acc: 0.31 Time: 38113.34 Local Steps: 1307800\n",
      "31.056625\n",
      "Train: Step:  6539 Val-Loss: 1.8092  Val-Acc: 0.31 Time: 38163.46 Local Steps: 1309600\n",
      "30.59409\n",
      "Train: Step:  6548 Val-Loss: 1.9413  Val-Acc: 0.27 Time: 38217.95 Local Steps: 1311400\n",
      "31.321955\n",
      "Train: Step:  6557 Val-Loss: 1.9822  Val-Acc: 0.27 Time: 38270.56 Local Steps: 1313200\n",
      "31.613678\n",
      "Train: Step:  6566 Val-Loss: 1.9128  Val-Acc: 0.28 Time: 38325.07 Local Steps: 1315000\n"
     ]
    }
   ],
   "source": [
    "start = time.time()\n",
    "\n",
    "log_period = 50 ## Simulation time difference between loggings.\n",
    "#logs, trainers = run(setups, \"mnist_qnn\", log_period, count=client_count)\n",
    "#logs, trainers = run(setups, \"mnist_hetero_qnn\", log_period, count=client_count)\n",
    "logs, trainers = run(setups, \"cifar_10_hetero_qnn\", log_period, count=client_count)\n",
    "#logs, trainers = run(setups, \"tinyimagenet\", log_period, count=client_count)\n",
    "\n",
    "end = time.time()\n",
    "print(f\"Finished in {end - start}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5f0388bf",
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "#plot_trends(logs, x_axis, y_axis, start = 5000)\n",
    "figname = \"cifar10_noniid_n100_svariable\"\n",
    "x_axis, y_axis = \"Time\", \"Loss\"\n",
    "plot_save(logs, x_axis, y_axis, name=figname)\n",
    "\n",
    "x_axis, y_axis = \"Time\", \"Variance\"\n",
    "plot_save(logs, x_axis, y_axis, name=figname)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ed9db203",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "898dc110",
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_save(logs, \"Local steps\", \"Accuracy\", name=figname)\n",
    "plot_save(logs, \"Server steps\", \"Accuracy\", name=figname)\n",
    "plot_save(logs, \"Time\", \"Accuracy\", name=figname)\n",
    "plot_save(logs, \"Local steps\", \"Variance\", name=figname)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "101224db",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
