{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "HkOk1l_44ERM"
   },
   "source": [
    "# Environmental Setup"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "tags": []
   },
   "source": [
    "## Install required packages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 3468,
     "status": "ok",
     "timestamp": 1726839022908,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "5mmqSh3szedt",
    "outputId": "e43c0051-f68f-4455-8dc7-f118b38c14e6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.44.2)\n",
      "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.16.0)\n",
      "Requirement already satisfied: huggingface-hub<1.0,>=0.23.2 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.24.7)\n",
      "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.26.4)\n",
      "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (24.1)\n",
      "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.2)\n",
      "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2024.9.11)\n",
      "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.32.3)\n",
      "Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.4.5)\n",
      "Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.19.1)\n",
      "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.5)\n",
      "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.23.2->transformers) (2024.6.1)\n",
      "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.23.2->transformers) (4.12.2)\n",
      "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.3.2)\n",
      "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.10)\n",
      "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.7)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2024.8.30)\n"
     ]
    }
   ],
   "source": [
    "! pip3 install transformers"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Import required packages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "executionInfo": {
     "elapsed": 385,
     "status": "ok",
     "timestamp": 1726839171077,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "-ODsn-k4YCmI"
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import torch\n",
    "import os\n",
    "import sys\n",
    "import datetime\n",
    "import time\n",
    "import ast\n",
    "from tqdm import tqdm\n",
    "import networkx as nx\n",
    "import numpy as np\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "\n",
    "# Vertex AI Packages\n",
    "import vertexai\n",
    "from vertexai.language_models import TextEmbeddingModel"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2,
     "status": "ok",
     "timestamp": 1726839214696,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "grJZp6ZSAFgx",
    "outputId": "49237209-3a6e-40ab-82a5-9c74045ec3f1"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "09-20-2024_1333\n"
     ]
    }
   ],
   "source": [
    "dt = datetime.datetime.now()\n",
    "datestr = dt.strftime(\"%m-%d-%Y_%H%M\")\n",
    "print(datestr)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "0ZpRswSo3cZh"
   },
   "source": [
    "## Grant drive access for data if working in Colab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 19431,
     "status": "ok",
     "timestamp": 1726839191439,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "ar4O_1tszb8L",
    "outputId": "c9d0bace-6147-4c80-b0af-1b2575d69067"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mounted at /content/drive/\n"
     ]
    }
   ],
   "source": [
    "from google.colab import drive\n",
    "drive.mount('/content/drive/', force_remount=True)\n",
    "sys.path.append('/content/drive/MyDrive/Colab Notebooks/')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {
    "executionInfo": {
     "elapsed": 11550,
     "status": "ok",
     "timestamp": 1726839202987,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "bRrVD8HNJNcy"
   },
   "outputs": [],
   "source": [
    "# if it's Colab runtime, authenticate the user with Google Cloud\n",
    "if \"google.colab\" in sys.modules:\n",
    "    from google.colab import auth\n",
    "\n",
    "    auth.authenticate_user()\n",
    "\n",
    "LOCATION = \"us-central1\"\n",
    "PROJECT_ID = \"synthetic-data-432701\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 7450,
     "status": "ok",
     "timestamp": 1726839210431,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "T4Zm3sxLJM9j",
    "outputId": "b0b8d97c-ba96-4923-f4c5-9059968e06d4"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Operation \"operations/acat.p2-29476227164-0cb33df5-fcca-4082-861f-1b7c5f1e9d96\" finished successfully.\n"
     ]
    }
   ],
   "source": [
    "! gcloud services enable compute.googleapis.com aiplatform.googleapis.com storage.googleapis.com bigquery.googleapis.com --project {PROJECT_ID}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 681,
     "status": "ok",
     "timestamp": 1726839212934,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "a0Yf9E5vzfsU",
    "outputId": "82d33ba3-667b-40f9-f624-c8ef0232cf03"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/content/drive/My Drive/Colab Notebooks/AnnotateGPT\n"
     ]
    }
   ],
   "source": [
    "%cd /content/drive/My Drive/Colab Notebooks/AnnotateGPT/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import Metric\n",
    "from run_Bert_model import model_train_validate_test\n",
    "from embed_text import get_embeddings_wrapper, get_embeddings_task\n",
    "from graph_utils import build_graph, max_cover_sampling, calculate_similarity_threshold\n",
    "import train"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "hPPfRpmnfjWo"
   },
   "source": [
    "# Train and validate BERT base models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {
    "executionInfo": {
     "elapsed": 12236,
     "status": "ok",
     "timestamp": 1726839230064,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "Ptimx4CB_Ml8"
   },
   "outputs": [],
   "source": [
    "NUM_REPS = 5 # number of replications on training models to get mean accuracy / std\n",
    "\n",
    "data_path = \"/content/drive/My Drive/Colab Notebooks/AnnotateGPT/data/\"\n",
    "test_df = pd.read_csv(os.path.join(data_path,\"test.tsv\"),sep='\\t',header=None, names=['similarity','s1'])\n",
    "target_dir = \"/content/drive/My Drive/Colab Notebooks/AnnotateGPT/Results\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "XQtCfaDI3k23"
   },
   "source": [
    "## Real-world training data baseline"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "PiJk76q4fkSK"
   },
   "outputs": [],
   "source": [
    "human_train_df = pd.read_csv(os.path.join(data_path,\"train.tsv\"),sep='\\t',header=None, names=['similarity','s1'])\n",
    "human_dev_df = pd.read_csv(os.path.join(data_path,\"dev.tsv\"),sep='\\t',header=None, names=['similarity','s1'])\n",
    "human_train_df = human_train_df.sample(n=6000, random_state=42) # Random downsample human_train_df to 6000 samples\n",
    "\n",
    "human_results_df = pd.DataFrame(columns=['acc','f1'])\n",
    "for i in range(NUM_REPS):\n",
    "    acc, f1 = train_model(human_train_df, test_df, target_dir, datestr, data=\"human\", k=250, dev_df=human_dev_df)\n",
    "    human_results_df = pd.concat([human_results_df, pd.DataFrame({'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
    "results_save_name = \"human_results.csv\"\n",
    "human_results_df.to_csv(os.path.join(target_dir, results_save_name))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "914qC1ZdCH5f"
   },
   "source": [
    "## Synthetic (zero-shot) training data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "W6Nrc1fW3vtx"
   },
   "source": [
    "### Data Loading"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {
    "executionInfo": {
     "elapsed": 1805,
     "status": "ok",
     "timestamp": 1726839235866,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "0MUw6H3DD5__"
   },
   "outputs": [],
   "source": [
    "syn_data_df = pd.read_csv(os.path.join(data_path,\"PGDG_6k.tsv\"),sep='\\t', names=['s1','similarity'])\n",
    "# remove header row\n",
    "syn_data_df = syn_data_df.iloc[1:]\n",
    "# Convert similarity column to int64\n",
    "syn_data_df['similarity'] = syn_data_df['similarity'].astype('int64')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "9o30KkQi34h0"
   },
   "source": [
    "### Train model on all 6,000 synthetic samples"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 2317591,
     "status": "ok",
     "timestamp": 1726844170548,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "aLYA2Tfbaf-C",
    "outputId": "77925265-3afd-4f1f-ebb1-34f68fe7f78e"
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7659, accuracy: 49.6667%, auc: 0.2795\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0607: 100%|██████████| 338/338 [00:27<00:00, 12.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.1213s, loss = 0.0607, accuracy: 98.2963%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7441s, loss: 0.0190, accuracy: 99.6667%, auc: 0.9993\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7133%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0716s, loss: 0.0083: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0217s, loss = 0.0083, accuracy: 99.8148%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7197s, loss: 0.0008, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7650%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0717s, loss: 0.0061: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0445s, loss = 0.0061, accuracy: 99.8889%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7433s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7622%\n",
      "\n",
      "Accuracy: 76.2%\n",
      "Precision: 80.3%\n",
      "Recall: 76.3%\n",
      "F1: 75.4%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.915     0.579     0.709       912\n",
      "     class_1      0.691     0.946     0.799       909\n",
      "\n",
      "    accuracy                          0.762      1821\n",
      "   macro avg      0.803     0.763     0.754      1821\n",
      "weighted avg      0.803     0.762     0.754      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-11-cfdc10f11d35>:26: FutureWarning: The behavior of DataFrame concatenation with empty or all-NA entries is deprecated. In a future version, this will no longer exclude empty or all-NA columns when determining the result dtypes. To retain the old behavior, exclude the relevant entries before the concat operation.\n",
      "  all_syn_results_df = pd.concat([all_syn_results_df, pd.DataFrame({'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7409, accuracy: 52.6667%, auc: 0.5057\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0716s, loss: 0.0534: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0165s, loss = 0.0534, accuracy: 98.2778%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7429s, loss: 0.0053, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7825%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0016: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0413s, loss = 0.0016, accuracy: 99.9815%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7435s, loss: 0.0009, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7743%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0003: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0245s, loss = 0.0003, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7428s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7803%\n",
      "\n",
      "Accuracy: 78.0%\n",
      "Precision: 79.9%\n",
      "Recall: 78.1%\n",
      "F1: 77.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.875     0.655     0.749       912\n",
      "     class_1      0.723     0.906     0.805       909\n",
      "\n",
      "    accuracy                          0.780      1821\n",
      "   macro avg      0.799     0.781     0.777      1821\n",
      "weighted avg      0.800     0.780     0.777      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6642, accuracy: 59.5000%, auc: 0.7050\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0538: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0131s, loss = 0.0538, accuracy: 98.6852%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7439s, loss: 0.0035, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7776%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0033: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0186s, loss = 0.0033, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7455s, loss: 0.0004, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7985%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0720s, loss: 0.0004: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0038s, loss = 0.0004, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7441s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7545%\n",
      "\n",
      "Accuracy: 75.5%\n",
      "Precision: 78.6%\n",
      "Recall: 75.5%\n",
      "F1: 74.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.881     0.590     0.707       912\n",
      "     class_1      0.691     0.920     0.789       909\n",
      "\n",
      "    accuracy                          0.755      1821\n",
      "   macro avg      0.786     0.755     0.748      1821\n",
      "weighted avg      0.786     0.755     0.748      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7460, accuracy: 47.5000%, auc: 0.4100\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0523: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0343s, loss = 0.0523, accuracy: 98.4630%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7466s, loss: 0.0009, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7479%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0721s, loss: 0.0044: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0094s, loss = 0.0044, accuracy: 99.8889%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7475s, loss: 0.0455, accuracy: 99.3333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 74.8%\n",
      "Precision: 77.4%\n",
      "Recall: 74.8%\n",
      "F1: 74.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.860     0.593     0.702       912\n",
      "     class_1      0.689     0.903     0.782       909\n",
      "\n",
      "    accuracy                          0.748      1821\n",
      "   macro avg      0.774     0.748     0.742      1821\n",
      "weighted avg      0.775     0.748     0.742      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7023, accuracy: 52.5000%, auc: 0.5603\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0519: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0351s, loss = 0.0519, accuracy: 98.2407%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7457s, loss: 0.0275, accuracy: 99.5000%, auc: 0.9999\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7309%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0121: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0013s, loss = 0.0121, accuracy: 99.7407%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7457s, loss: 0.0021, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7935%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0006: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 26.9998s, loss = 0.0006, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7436s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.8001%\n",
      "\n",
      "Accuracy: 80.0%\n",
      "Precision: 81.4%\n",
      "Recall: 80.0%\n",
      "F1: 79.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.882     0.694     0.777       912\n",
      "     class_1      0.747     0.906     0.819       909\n",
      "\n",
      "    accuracy                          0.800      1821\n",
      "   macro avg      0.814     0.800     0.798      1821\n",
      "weighted avg      0.814     0.800     0.798      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8072, accuracy: 44.5000%, auc: 0.4481\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0488: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0301s, loss = 0.0488, accuracy: 98.5370%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7450s, loss: 0.0050, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7177%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0049: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0034s, loss = 0.0049, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7417s, loss: 0.0006, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7595%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0050: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0203s, loss = 0.0050, accuracy: 99.9074%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7469s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.8056%\n",
      "\n",
      "Accuracy: 80.6%\n",
      "Precision: 80.9%\n",
      "Recall: 80.6%\n",
      "F1: 80.5%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.840     0.755     0.796       912\n",
      "     class_1      0.777     0.856     0.815       909\n",
      "\n",
      "    accuracy                          0.806      1821\n",
      "   macro avg      0.809     0.806     0.805      1821\n",
      "weighted avg      0.809     0.806     0.805      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6889, accuracy: 52.8333%, auc: 0.5903\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0477: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0115s, loss = 0.0477, accuracy: 98.5556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7480s, loss: 0.0012, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7836%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0083: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0004s, loss = 0.0083, accuracy: 99.7963%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7469s, loss: 0.0015, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.8029%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0018: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0000s, loss = 0.0018, accuracy: 99.9815%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7460s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7935%\n",
      "\n",
      "Accuracy: 79.4%\n",
      "Precision: 79.4%\n",
      "Recall: 79.3%\n",
      "F1: 79.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.782     0.816     0.798       912\n",
      "     class_1      0.807     0.771     0.789       909\n",
      "\n",
      "    accuracy                          0.794      1821\n",
      "   macro avg      0.794     0.793     0.793      1821\n",
      "weighted avg      0.794     0.794     0.793      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7187, accuracy: 47.6667%, auc: 0.6158\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0505: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0123s, loss = 0.0505, accuracy: 98.5000%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7478s, loss: 0.0009, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7243%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0060: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0080s, loss = 0.0060, accuracy: 99.8519%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7362s, loss: 0.0028, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 72.4%\n",
      "Precision: 78.8%\n",
      "Recall: 72.5%\n",
      "F1: 70.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.924     0.490     0.640       912\n",
      "     class_1      0.652     0.959     0.776       909\n",
      "\n",
      "    accuracy                          0.724      1821\n",
      "   macro avg      0.788     0.725     0.708      1821\n",
      "weighted avg      0.788     0.724     0.708      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7525, accuracy: 41.3333%, auc: 0.2978\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0594: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0125s, loss = 0.0594, accuracy: 97.9074%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7443s, loss: 0.0013, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7935%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0716s, loss: 0.0046: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0346s, loss = 0.0046, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7436s, loss: 0.0091, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 79.4%\n",
      "Precision: 80.4%\n",
      "Recall: 79.4%\n",
      "F1: 79.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.861     0.701     0.773       912\n",
      "     class_1      0.747     0.887     0.811       909\n",
      "\n",
      "    accuracy                          0.794      1821\n",
      "   macro avg      0.804     0.794     0.792      1821\n",
      "weighted avg      0.804     0.794     0.792      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6724, accuracy: 56.3333%, auc: 0.6621\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0720s, loss: 0.0537: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0135s, loss = 0.0537, accuracy: 98.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7369s, loss: 0.0030, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7847%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0716s, loss: 0.0083: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0423s, loss = 0.0083, accuracy: 99.7963%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7430s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7979%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0715s, loss: 0.0028: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0201s, loss = 0.0028, accuracy: 99.8704%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7425s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.8023%\n",
      "\n",
      "Accuracy: 80.2%\n",
      "Precision: 80.8%\n",
      "Recall: 80.2%\n",
      "F1: 80.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.850     0.735     0.788       912\n",
      "     class_1      0.766     0.870     0.815       909\n",
      "\n",
      "    accuracy                          0.802      1821\n",
      "   macro avg      0.808     0.802     0.801      1821\n",
      "weighted avg      0.808     0.802     0.801      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7155, accuracy: 47.8333%, auc: 0.6238\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0716s, loss: 0.0493: 100%|██████████| 338/338 [00:27<00:00, 12.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0545s, loss = 0.0493, accuracy: 98.4815%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7404s, loss: 0.0042, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7551%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0717s, loss: 0.0018: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0459s, loss = 0.0018, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7412s, loss: 0.0080, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7507%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0717s, loss: 0.0034: 100%|██████████| 338/338 [00:27<00:00, 12.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0613s, loss = 0.0034, accuracy: 99.9444%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7427s, loss: 0.0037, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6875%\n",
      "\n",
      "Accuracy: 68.8%\n",
      "Precision: 74.1%\n",
      "Recall: 68.8%\n",
      "F1: 66.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.855     0.453     0.592       912\n",
      "     class_1      0.627     0.923     0.747       909\n",
      "\n",
      "    accuracy                          0.688      1821\n",
      "   macro avg      0.741     0.688     0.669      1821\n",
      "weighted avg      0.741     0.688     0.669      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7393, accuracy: 47.5000%, auc: 0.4696\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0717s, loss: 0.0519: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0176s, loss = 0.0519, accuracy: 98.5926%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7429s, loss: 0.0071, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7809%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0084: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0261s, loss = 0.0084, accuracy: 99.7963%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7388s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7474%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0720s, loss: 0.0003: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0379s, loss = 0.0003, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7444s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7781%\n",
      "\n",
      "Accuracy: 77.8%\n",
      "Precision: 80.9%\n",
      "Recall: 77.8%\n",
      "F1: 77.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.906     0.622     0.737       912\n",
      "     class_1      0.711     0.935     0.808       909\n",
      "\n",
      "    accuracy                          0.778      1821\n",
      "   macro avg      0.809     0.778     0.773      1821\n",
      "weighted avg      0.809     0.778     0.773      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7448, accuracy: 40.8333%, auc: 0.3663\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0510: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0181s, loss = 0.0510, accuracy: 98.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7368s, loss: 0.0012, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6914%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0721s, loss: 0.0088: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0111s, loss = 0.0088, accuracy: 99.8148%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7339s, loss: 0.0070, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 69.1%\n",
      "Precision: 75.7%\n",
      "Recall: 69.2%\n",
      "F1: 67.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.887     0.440     0.588       912\n",
      "     class_1      0.627     0.944     0.753       909\n",
      "\n",
      "    accuracy                          0.691      1821\n",
      "   macro avg      0.757     0.692     0.671      1821\n",
      "weighted avg      0.757     0.691     0.670      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8827, accuracy: 47.3333%, auc: 0.3105\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0521: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0097s, loss = 0.0521, accuracy: 98.3148%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7384s, loss: 0.0172, accuracy: 99.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7655%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0071: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0350s, loss = 0.0071, accuracy: 99.8333%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7412s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7825%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0721s, loss: 0.0019: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0038s, loss = 0.0019, accuracy: 99.9815%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7431s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7891%\n",
      "\n",
      "Accuracy: 78.9%\n",
      "Precision: 79.3%\n",
      "Recall: 78.9%\n",
      "F1: 78.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.829     0.729     0.776       912\n",
      "     class_1      0.758     0.849     0.801       909\n",
      "\n",
      "    accuracy                          0.789      1821\n",
      "   macro avg      0.793     0.789     0.788      1821\n",
      "weighted avg      0.793     0.789     0.788      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7568, accuracy: 39.5000%, auc: 0.2744\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0615: 100%|██████████| 338/338 [00:27<00:00, 12.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0567s, loss = 0.0615, accuracy: 97.9630%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7442s, loss: 0.0226, accuracy: 99.3333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.8023%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0047: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0003s, loss = 0.0047, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7449s, loss: 0.0003, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7853%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0720s, loss: 0.0027: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0190s, loss = 0.0027, accuracy: 99.9444%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7422s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7748%\n",
      "\n",
      "Accuracy: 77.5%\n",
      "Precision: 81.1%\n",
      "Recall: 77.5%\n",
      "F1: 76.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.918     0.604     0.729       912\n",
      "     class_1      0.704     0.946     0.808       909\n",
      "\n",
      "    accuracy                          0.775      1821\n",
      "   macro avg      0.811     0.775     0.768      1821\n",
      "weighted avg      0.812     0.775     0.768      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6684, accuracy: 56.1667%, auc: 0.7302\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0720s, loss: 0.0486: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0340s, loss = 0.0486, accuracy: 98.5741%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7410s, loss: 0.0020, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7622%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0719s, loss: 0.0023: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0210s, loss = 0.0023, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7407s, loss: 0.0011, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6096%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0007: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0399s, loss = 0.0007, accuracy: 99.9815%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7426s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7886%\n",
      "\n",
      "Accuracy: 78.9%\n",
      "Precision: 81.0%\n",
      "Recall: 78.9%\n",
      "F1: 78.5%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.892     0.658     0.757       912\n",
      "     class_1      0.728     0.920     0.813       909\n",
      "\n",
      "    accuracy                          0.789      1821\n",
      "   macro avg      0.810     0.789     0.785      1821\n",
      "weighted avg      0.810     0.789     0.785      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8079, accuracy: 52.1667%, auc: 0.3787\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0721s, loss: 0.0594: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0147s, loss = 0.0594, accuracy: 97.9630%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7448s, loss: 0.0029, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7364%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0090: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0446s, loss = 0.0090, accuracy: 99.7778%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7416s, loss: 0.0005, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7227%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0004: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0029s, loss = 0.0004, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7433s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7441%\n",
      "\n",
      "Accuracy: 74.4%\n",
      "Precision: 77.7%\n",
      "Recall: 74.4%\n",
      "F1: 73.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.872     0.573     0.692       912\n",
      "     class_1      0.681     0.915     0.781       909\n",
      "\n",
      "    accuracy                          0.744      1821\n",
      "   macro avg      0.777     0.744     0.737      1821\n",
      "weighted avg      0.777     0.744     0.736      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6741, accuracy: 56.5000%, auc: 0.6211\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0534: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0336s, loss = 0.0534, accuracy: 98.5370%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7481s, loss: 0.0119, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7781%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0047: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 26.9993s, loss = 0.0047, accuracy: 99.8148%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7451s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7908%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0002: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0012s, loss = 0.0002, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7464s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7935%\n",
      "\n",
      "Accuracy: 79.4%\n",
      "Precision: 80.5%\n",
      "Recall: 79.4%\n",
      "F1: 79.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.866     0.695     0.771       912\n",
      "     class_1      0.745     0.892     0.812       909\n",
      "\n",
      "    accuracy                          0.794      1821\n",
      "   macro avg      0.805     0.794     0.792      1821\n",
      "weighted avg      0.806     0.794     0.792      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7411, accuracy: 40.8333%, auc: 0.2311\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0572: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0207s, loss = 0.0572, accuracy: 98.3704%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7389s, loss: 0.0010, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.8100%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0098: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0038s, loss = 0.0098, accuracy: 99.7963%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7367s, loss: 0.0004, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7897%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0038: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0177s, loss = 0.0038, accuracy: 99.9259%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7465s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.8210%\n",
      "\n",
      "Accuracy: 82.1%\n",
      "Precision: 82.2%\n",
      "Recall: 82.1%\n",
      "F1: 82.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.801     0.854     0.827       912\n",
      "     class_1      0.843     0.788     0.815       909\n",
      "\n",
      "    accuracy                          0.821      1821\n",
      "   macro avg      0.822     0.821     0.821      1821\n",
      "weighted avg      0.822     0.821     0.821      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7710, accuracy: 47.3333%, auc: 0.4317\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0445: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0181s, loss = 0.0445, accuracy: 98.6852%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7462s, loss: 0.0146, accuracy: 99.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7853%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0055: 100%|██████████| 338/338 [00:27<00:00, 12.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0340s, loss = 0.0055, accuracy: 99.8704%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7436s, loss: 0.0064, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6914%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0036: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 26.9988s, loss = 0.0036, accuracy: 99.8889%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7457s, loss: 0.0057, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7721%\n",
      "\n",
      "Accuracy: 77.2%\n",
      "Precision: 79.3%\n",
      "Recall: 77.2%\n",
      "F1: 76.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.715     0.906     0.799       912\n",
      "     class_1      0.871     0.638     0.737       909\n",
      "\n",
      "    accuracy                          0.772      1821\n",
      "   macro avg      0.793     0.772     0.768      1821\n",
      "weighted avg      0.793     0.772     0.768      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7940, accuracy: 44.3333%, auc: 0.3158\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0577: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0170s, loss = 0.0577, accuracy: 98.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7450s, loss: 0.0093, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7765%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0037: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 26.9997s, loss = 0.0037, accuracy: 99.9444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7468s, loss: 0.0145, accuracy: 99.6667%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 77.6%\n",
      "Precision: 77.7%\n",
      "Recall: 77.6%\n",
      "F1: 77.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.769     0.791     0.780       912\n",
      "     class_1      0.784     0.762     0.773       909\n",
      "\n",
      "    accuracy                          0.776      1821\n",
      "   macro avg      0.777     0.776     0.776      1821\n",
      "weighted avg      0.777     0.776     0.776      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7102, accuracy: 47.5000%, auc: 0.4286\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0547: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0112s, loss = 0.0547, accuracy: 98.1667%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7457s, loss: 0.0020, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.8051%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0039: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0242s, loss = 0.0039, accuracy: 99.9259%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7460s, loss: 0.0005, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7414%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0012: 100%|██████████| 338/338 [00:26<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 26.9998s, loss = 0.0012, accuracy: 99.9815%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7454s, loss: 0.0001, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7869%\n",
      "\n",
      "Accuracy: 78.7%\n",
      "Precision: 79.9%\n",
      "Recall: 78.7%\n",
      "F1: 78.5%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.739     0.888     0.807       912\n",
      "     class_1      0.859     0.685     0.763       909\n",
      "\n",
      "    accuracy                          0.787      1821\n",
      "   macro avg      0.799     0.787     0.785      1821\n",
      "weighted avg      0.799     0.787     0.785      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6811, accuracy: 58.0000%, auc: 0.6413\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0483: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0140s, loss = 0.0483, accuracy: 98.7407%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7462s, loss: 0.0131, accuracy: 99.8333%, auc: 0.9999\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7595%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0062: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0043s, loss = 0.0062, accuracy: 99.8519%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7414s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7683%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0032: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0193s, loss = 0.0032, accuracy: 99.8889%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.7453s, loss: 0.0002, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7672%\n",
      "\n",
      "Accuracy: 76.7%\n",
      "Precision: 78.7%\n",
      "Recall: 76.7%\n",
      "F1: 76.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.863     0.636     0.732       912\n",
      "     class_1      0.711     0.899     0.794       909\n",
      "\n",
      "    accuracy                          0.767      1821\n",
      "   macro avg      0.787     0.767     0.763      1821\n",
      "weighted avg      0.787     0.767     0.763      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6839, accuracy: 55.1667%, auc: 0.6106\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0726s, loss: 0.0471: 100%|██████████| 338/338 [00:27<00:00, 12.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.1516s, loss = 0.0471, accuracy: 98.6481%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7464s, loss: 0.0009, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7315%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0026: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0204s, loss = 0.0026, accuracy: 99.9630%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7413s, loss: 0.0032, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 73.1%\n",
      "Precision: 78.5%\n",
      "Recall: 73.2%\n",
      "F1: 71.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.909     0.515     0.658       912\n",
      "     class_1      0.661     0.948     0.779       909\n",
      "\n",
      "    accuracy                          0.731      1821\n",
      "   macro avg      0.785     0.732     0.718      1821\n",
      "weighted avg      0.785     0.731     0.718      1821\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7100, accuracy: 49.1667%, auc: 0.4731\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0723s, loss: 0.0536: 100%|██████████| 338/338 [00:27<00:00, 12.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0112s, loss = 0.0536, accuracy: 98.3704%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.7450s, loss: 0.0014, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7144%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.0722s, loss: 0.0066: 100%|██████████| 338/338 [00:27<00:00, 12.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 27.0046s, loss = 0.0066, accuracy: 99.8519%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.7427s, loss: 0.0019, accuracy: 99.8333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 71.4%\n",
      "Precision: 77.9%\n",
      "Recall: 71.5%\n",
      "F1: 69.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.914     0.475     0.625       912\n",
      "     class_1      0.644     0.955     0.770       909\n",
      "\n",
      "    accuracy                          0.714      1821\n",
      "   macro avg      0.779     0.715     0.697      1821\n",
      "weighted avg      0.779     0.714     0.697      1821\n",
      "\n"
     ]
    }
   ],
   "source": [
    "all_syn_results_df = pd.DataFrame(columns=['acc','f1'])\n",
    "for i in range(NUM_REPS):\n",
    "    acc, f1 = train_model(syn_data_df, test_df, target_dir, datestr, data=\"all syn\")\n",
    "    all_syn_results_df = pd.concat([all_syn_results_df, pd.DataFrame({'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
    "\n",
    "results_save_name = f\"all_syn_results-f{datestr}.csv\"\n",
    "all_syn_results_df.to_csv(os.path.join(target_dir, results_save_name))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "2iCFJ1p-3-DO"
   },
   "source": [
    "## Downsampling of \"representative\" synthetic data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "EXnz8WcPGn7r"
   },
   "source": [
    "### Check for / get embedding data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# if \"syn_data_embeddings.tsv\" exists, load it\n",
    "if os.path.exists(os.path.join(data_path,\"syn_data_embeddings.tsv\")):\n",
    "    syn_data_df = pd.read_csv(os.path.join(data_path,\"syn_data_embeddings.tsv\"),sep='\\t')\n",
    "    syn_data_df['similarity'] = syn_data_df['similarity'].astype('int64')\n",
    "    syn_data_df['embedding'] = syn_data_df['embedding'].apply(ast.literal_eval)\n",
    "else:\n",
    "    # get embeddings for the question titles and add them as \"embedding\" column\n",
    "    embeddings = get_embeddings_wrapper(syn_data_df['s1'])\n",
    "    # append synthetic reviw with corresponding embedding in dataframe and label of whether the review is positive or negative, as well as the genre\n",
    "    syn_data_df = pd.DataFrame({\"s1\": syn_data_df['s1'], \"similarity\": syn_data_df['similarity'], \"embedding\": embeddings})\n",
    "    syn_data_df.to_csv(os.path.join(data_path,\"syn_data_embeddings.tsv\"), sep='\\t')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "tZStBJTICJTX"
   },
   "outputs": [],
   "source": [
    "pos_syn_df = syn_data_df[syn_data_df['similarity'] == 1]\n",
    "neg_syn_df = syn_data_df[syn_data_df['similarity'] == 0]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "IFtHYSJStSEM"
   },
   "source": [
    "### Train model on $k$-Max Cover Selected Samples\n",
    "\n",
    "Postitive and negative samples are segregated and $\\frac{k}{2}$ points are selected using the max-cover implementation for each class then recombined."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "executionInfo": {
     "elapsed": 442,
     "status": "ok",
     "timestamp": 1726542845838,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "Shuu7QWEEHv5",
    "outputId": "8d1916c2-13bc-4baa-c3f1-8ee565bd3c02"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[100, 400, 700, 1000, 1300, 1600, 1900, 2200, 2500, 2800, 3100]\n"
     ]
    }
   ],
   "source": [
    "# Set Ks from 100 to 1200\n",
    "Ks = list(range(100, 3300, 300))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "N397u-FIqciH",
    "outputId": "48951ef7-377e-411e-f71f-6a48b50cfe9a"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "K: 100\n",
      "sim: 0.5\n",
      "sim: 0.75\n",
      "sim: 0.625\n",
      "sim: 0.6875\n",
      "sim: 0.5\n",
      "sim: 0.75\n",
      "sim: 0.875\n",
      "sim: 0.8125\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8145, accuracy: 20.0000%, auc: 0.7500\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.5823: 100%|██████████| 6/6 [00:00<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.0032s, loss = 0.5823, accuracy: 74.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0210s, loss: 0.3775, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5283%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1408s, loss: 0.4598: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9242s, loss = 0.4598, accuracy: 84.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0215s, loss: 0.3077, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5360%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1417s, loss: 0.2961: 100%|██████████| 6/6 [00:00<00:00,  6.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9290s, loss = 0.2961, accuracy: 96.6667%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0244s, loss: 0.1825, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6019%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1413s, loss: 0.2081: 100%|██████████| 6/6 [00:00<00:00,  6.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9256s, loss = 0.2081, accuracy: 97.7778%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0243s, loss: 0.1273, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6436%\n",
      "\n",
      "* Training epoch 5:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1410s, loss: 0.1477: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9285s, loss = 0.1477, accuracy: 100.0000%\n",
      "* Validation for epoch 5:\n",
      "-> Valid. time: 0.0238s, loss: 0.0977, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 5:\n",
      "Test accuracy: 0.6540%\n",
      "\n",
      "* Training epoch 6:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1401s, loss: 0.1002: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9221s, loss = 0.1002, accuracy: 100.0000%\n",
      "* Validation for epoch 6:\n",
      "-> Valid. time: 0.0219s, loss: 0.0774, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 6:\n",
      "Test accuracy: 0.6365%\n",
      "\n",
      "* Training epoch 7:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1389s, loss: 0.0883: 100%|██████████| 6/6 [00:00<00:00,  6.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9121s, loss = 0.0883, accuracy: 100.0000%\n",
      "* Validation for epoch 7:\n",
      "-> Valid. time: 0.0214s, loss: 0.0612, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 7:\n",
      "Test accuracy: 0.6535%\n",
      "\n",
      "* Training epoch 8:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0655: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9155s, loss = 0.0655, accuracy: 100.0000%\n",
      "* Validation for epoch 8:\n",
      "-> Valid. time: 0.0218s, loss: 0.0499, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 8:\n",
      "Test accuracy: 0.6798%\n",
      "\n",
      "* Training epoch 9:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0570: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9142s, loss = 0.0570, accuracy: 100.0000%\n",
      "* Validation for epoch 9:\n",
      "-> Valid. time: 0.0215s, loss: 0.0428, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 9:\n",
      "Test accuracy: 0.6897%\n",
      "\n",
      "* Training epoch 10:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1410s, loss: 0.0499: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9285s, loss = 0.0499, accuracy: 100.0000%\n",
      "* Validation for epoch 10:\n",
      "-> Valid. time: 0.0224s, loss: 0.0379, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 10:\n",
      "Test accuracy: 0.6919%\n",
      "\n",
      "* Training epoch 11:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1420s, loss: 0.0460: 100%|██████████| 6/6 [00:00<00:00,  6.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9311s, loss = 0.0460, accuracy: 100.0000%\n",
      "* Validation for epoch 11:\n",
      "-> Valid. time: 0.0231s, loss: 0.0344, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 11:\n",
      "Test accuracy: 0.6875%\n",
      "\n",
      "* Training epoch 12:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1390s, loss: 0.0430: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9138s, loss = 0.0430, accuracy: 100.0000%\n",
      "* Validation for epoch 12:\n",
      "-> Valid. time: 0.0231s, loss: 0.0318, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 12:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 13:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1388s, loss: 0.0387: 100%|██████████| 6/6 [00:00<00:00,  6.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9127s, loss = 0.0387, accuracy: 100.0000%\n",
      "* Validation for epoch 13:\n",
      "-> Valid. time: 0.0240s, loss: 0.0298, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 13:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 14:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1400s, loss: 0.0374: 100%|██████████| 6/6 [00:00<00:00,  6.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9197s, loss = 0.0374, accuracy: 100.0000%\n",
      "* Validation for epoch 14:\n",
      "-> Valid. time: 0.0247s, loss: 0.0282, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 14:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 15:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1405s, loss: 0.0329: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9246s, loss = 0.0329, accuracy: 100.0000%\n",
      "* Validation for epoch 15:\n",
      "-> Valid. time: 0.0228s, loss: 0.0270, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 15:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 16:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0338: 100%|██████████| 6/6 [00:00<00:00,  6.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9258s, loss = 0.0338, accuracy: 100.0000%\n",
      "* Validation for epoch 16:\n",
      "-> Valid. time: 0.0218s, loss: 0.0260, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 16:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 17:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1392s, loss: 0.0319: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9176s, loss = 0.0319, accuracy: 100.0000%\n",
      "* Validation for epoch 17:\n",
      "-> Valid. time: 0.0236s, loss: 0.0252, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 17:\n",
      "Test accuracy: 0.6820%\n",
      "\n",
      "* Training epoch 18:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1402s, loss: 0.0309: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9235s, loss = 0.0309, accuracy: 100.0000%\n",
      "* Validation for epoch 18:\n",
      "-> Valid. time: 0.0228s, loss: 0.0246, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 18:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 19:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0309: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9186s, loss = 0.0309, accuracy: 100.0000%\n",
      "* Validation for epoch 19:\n",
      "-> Valid. time: 0.0222s, loss: 0.0240, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 19:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 20:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1408s, loss: 0.0306: 100%|██████████| 6/6 [00:00<00:00,  6.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9293s, loss = 0.0306, accuracy: 100.0000%\n",
      "* Validation for epoch 20:\n",
      "-> Valid. time: 0.0228s, loss: 0.0235, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 20:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 21:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1400s, loss: 0.0300: 100%|██████████| 6/6 [00:00<00:00,  6.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9237s, loss = 0.0300, accuracy: 100.0000%\n",
      "* Validation for epoch 21:\n",
      "-> Valid. time: 0.0229s, loss: 0.0231, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 21:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 22:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1411s, loss: 0.0291: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9256s, loss = 0.0291, accuracy: 100.0000%\n",
      "* Validation for epoch 22:\n",
      "-> Valid. time: 0.0217s, loss: 0.0228, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 22:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 23:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1405s, loss: 0.0290: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9251s, loss = 0.0290, accuracy: 100.0000%\n",
      "* Validation for epoch 23:\n",
      "-> Valid. time: 0.0254s, loss: 0.0225, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 23:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 24:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.0279: 100%|██████████| 6/6 [00:00<00:00,  6.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9189s, loss = 0.0279, accuracy: 100.0000%\n",
      "* Validation for epoch 24:\n",
      "-> Valid. time: 0.0209s, loss: 0.0223, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 24:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 25:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1397s, loss: 0.0289: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9170s, loss = 0.0289, accuracy: 100.0000%\n",
      "* Validation for epoch 25:\n",
      "-> Valid. time: 0.0216s, loss: 0.0220, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 25:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 26:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0264: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9166s, loss = 0.0264, accuracy: 100.0000%\n",
      "* Validation for epoch 26:\n",
      "-> Valid. time: 0.0225s, loss: 0.0219, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 26:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 27:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1393s, loss: 0.0262: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9180s, loss = 0.0262, accuracy: 100.0000%\n",
      "* Validation for epoch 27:\n",
      "-> Valid. time: 0.0239s, loss: 0.0217, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 27:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 28:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1417s, loss: 0.0270: 100%|██████████| 6/6 [00:00<00:00,  6.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9295s, loss = 0.0270, accuracy: 100.0000%\n",
      "* Validation for epoch 28:\n",
      "-> Valid. time: 0.0228s, loss: 0.0216, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 28:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 29:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1390s, loss: 0.0282: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9175s, loss = 0.0282, accuracy: 100.0000%\n",
      "* Validation for epoch 29:\n",
      "-> Valid. time: 0.0244s, loss: 0.0215, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 29:\n",
      "Test accuracy: 0.6842%\n",
      "\n",
      "* Training epoch 30:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1400s, loss: 0.0270: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9211s, loss = 0.0270, accuracy: 100.0000%\n",
      "* Validation for epoch 30:\n",
      "-> Valid. time: 0.0241s, loss: 0.0214, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 30:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 31:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1391s, loss: 0.0264: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9144s, loss = 0.0264, accuracy: 100.0000%\n",
      "* Validation for epoch 31:\n",
      "-> Valid. time: 0.0229s, loss: 0.0213, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 31:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 32:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1411s, loss: 0.0268: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9278s, loss = 0.0268, accuracy: 100.0000%\n",
      "* Validation for epoch 32:\n",
      "-> Valid. time: 0.0240s, loss: 0.0213, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 32:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 33:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1386s, loss: 0.0265: 100%|██████████| 6/6 [00:00<00:00,  6.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9115s, loss = 0.0265, accuracy: 100.0000%\n",
      "* Validation for epoch 33:\n",
      "-> Valid. time: 0.0236s, loss: 0.0212, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 33:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 34:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1397s, loss: 0.0273: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9198s, loss = 0.0273, accuracy: 100.0000%\n",
      "* Validation for epoch 34:\n",
      "-> Valid. time: 0.0235s, loss: 0.0212, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 34:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 35:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0284: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9157s, loss = 0.0284, accuracy: 100.0000%\n",
      "* Validation for epoch 35:\n",
      "-> Valid. time: 0.0218s, loss: 0.0211, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 35:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 36:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0274: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9157s, loss = 0.0274, accuracy: 100.0000%\n",
      "* Validation for epoch 36:\n",
      "-> Valid. time: 0.0222s, loss: 0.0211, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 36:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 37:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1396s, loss: 0.0262: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9147s, loss = 0.0262, accuracy: 100.0000%\n",
      "* Validation for epoch 37:\n",
      "-> Valid. time: 0.0220s, loss: 0.0210, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 37:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 38:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1389s, loss: 0.0268: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9153s, loss = 0.0268, accuracy: 100.0000%\n",
      "* Validation for epoch 38:\n",
      "-> Valid. time: 0.0229s, loss: 0.0210, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 38:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 39:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1411s, loss: 0.0268: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9263s, loss = 0.0268, accuracy: 100.0000%\n",
      "* Validation for epoch 39:\n",
      "-> Valid. time: 0.0213s, loss: 0.0210, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 39:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 40:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1407s, loss: 0.0266: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9265s, loss = 0.0266, accuracy: 100.0000%\n",
      "* Validation for epoch 40:\n",
      "-> Valid. time: 0.0229s, loss: 0.0210, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 40:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 41:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1390s, loss: 0.0269: 100%|██████████| 6/6 [00:00<00:00,  6.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9133s, loss = 0.0269, accuracy: 100.0000%\n",
      "* Validation for epoch 41:\n",
      "-> Valid. time: 0.0235s, loss: 0.0209, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 41:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 42:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0262: 100%|██████████| 6/6 [00:00<00:00,  6.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9206s, loss = 0.0262, accuracy: 100.0000%\n",
      "* Validation for epoch 42:\n",
      "-> Valid. time: 0.0221s, loss: 0.0209, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 42:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 43:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1393s, loss: 0.0278: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9132s, loss = 0.0278, accuracy: 100.0000%\n",
      "* Validation for epoch 43:\n",
      "-> Valid. time: 0.0240s, loss: 0.0209, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 43:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 44:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1420s, loss: 0.0263: 100%|██████████| 6/6 [00:00<00:00,  6.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9345s, loss = 0.0263, accuracy: 100.0000%\n",
      "* Validation for epoch 44:\n",
      "-> Valid. time: 0.0230s, loss: 0.0208, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 44:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 45:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1396s, loss: 0.0270: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9173s, loss = 0.0270, accuracy: 100.0000%\n",
      "* Validation for epoch 45:\n",
      "-> Valid. time: 0.0223s, loss: 0.0208, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 45:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 46:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1396s, loss: 0.0264: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9172s, loss = 0.0264, accuracy: 100.0000%\n",
      "* Validation for epoch 46:\n",
      "-> Valid. time: 0.0235s, loss: 0.0208, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 46:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 47:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1384s, loss: 0.0277: 100%|██████████| 6/6 [00:00<00:00,  6.62it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9099s, loss = 0.0277, accuracy: 100.0000%\n",
      "* Validation for epoch 47:\n",
      "-> Valid. time: 0.0234s, loss: 0.0208, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 47:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 48:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1391s, loss: 0.0267: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9146s, loss = 0.0267, accuracy: 100.0000%\n",
      "* Validation for epoch 48:\n",
      "-> Valid. time: 0.0217s, loss: 0.0207, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 48:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 49:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1412s, loss: 0.0258: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9286s, loss = 0.0258, accuracy: 100.0000%\n",
      "* Validation for epoch 49:\n",
      "-> Valid. time: 0.0232s, loss: 0.0207, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 49:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 50:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.0263: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9212s, loss = 0.0263, accuracy: 100.0000%\n",
      "* Validation for epoch 50:\n",
      "-> Valid. time: 0.0255s, loss: 0.0207, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 50:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 51:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1415s, loss: 0.0291: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9283s, loss = 0.0291, accuracy: 100.0000%\n",
      "* Validation for epoch 51:\n",
      "-> Valid. time: 0.0229s, loss: 0.0206, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 51:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 52:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1402s, loss: 0.0257: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9208s, loss = 0.0257, accuracy: 100.0000%\n",
      "* Validation for epoch 52:\n",
      "-> Valid. time: 0.0223s, loss: 0.0206, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 52:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 53:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0264: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9156s, loss = 0.0264, accuracy: 100.0000%\n",
      "* Validation for epoch 53:\n",
      "-> Valid. time: 0.0230s, loss: 0.0206, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 53:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 54:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0262: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9253s, loss = 0.0262, accuracy: 100.0000%\n",
      "* Validation for epoch 54:\n",
      "-> Valid. time: 0.0219s, loss: 0.0206, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 54:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 55:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1401s, loss: 0.0259: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9191s, loss = 0.0259, accuracy: 100.0000%\n",
      "* Validation for epoch 55:\n",
      "-> Valid. time: 0.0218s, loss: 0.0205, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 55:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 56:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1396s, loss: 0.0262: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9187s, loss = 0.0262, accuracy: 100.0000%\n",
      "* Validation for epoch 56:\n",
      "-> Valid. time: 0.0219s, loss: 0.0205, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 56:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 57:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1414s, loss: 0.0265: 100%|██████████| 6/6 [00:00<00:00,  6.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9315s, loss = 0.0265, accuracy: 100.0000%\n",
      "* Validation for epoch 57:\n",
      "-> Valid. time: 0.0229s, loss: 0.0205, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 57:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 58:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1413s, loss: 0.0276: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9284s, loss = 0.0276, accuracy: 100.0000%\n",
      "* Validation for epoch 58:\n",
      "-> Valid. time: 0.0227s, loss: 0.0204, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 58:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 59:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.0255: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9177s, loss = 0.0255, accuracy: 100.0000%\n",
      "* Validation for epoch 59:\n",
      "-> Valid. time: 0.0213s, loss: 0.0204, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 59:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 60:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1417s, loss: 0.0259: 100%|██████████| 6/6 [00:00<00:00,  6.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9300s, loss = 0.0259, accuracy: 100.0000%\n",
      "* Validation for epoch 60:\n",
      "-> Valid. time: 0.0244s, loss: 0.0204, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 60:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 61:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1411s, loss: 0.0256: 100%|██████████| 6/6 [00:00<00:00,  6.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9276s, loss = 0.0256, accuracy: 100.0000%\n",
      "* Validation for epoch 61:\n",
      "-> Valid. time: 0.0225s, loss: 0.0203, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 61:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 62:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0274: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9279s, loss = 0.0274, accuracy: 100.0000%\n",
      "* Validation for epoch 62:\n",
      "-> Valid. time: 0.0228s, loss: 0.0203, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 62:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 63:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1410s, loss: 0.0265: 100%|██████████| 6/6 [00:00<00:00,  6.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9276s, loss = 0.0265, accuracy: 100.0000%\n",
      "* Validation for epoch 63:\n",
      "-> Valid. time: 0.0257s, loss: 0.0203, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 63:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 64:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0261: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9164s, loss = 0.0261, accuracy: 100.0000%\n",
      "* Validation for epoch 64:\n",
      "-> Valid. time: 0.0218s, loss: 0.0202, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 64:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 65:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1414s, loss: 0.0263: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9257s, loss = 0.0263, accuracy: 100.0000%\n",
      "* Validation for epoch 65:\n",
      "-> Valid. time: 0.0214s, loss: 0.0202, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 65:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 66:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.0245: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9160s, loss = 0.0245, accuracy: 100.0000%\n",
      "* Validation for epoch 66:\n",
      "-> Valid. time: 0.0213s, loss: 0.0201, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 66:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 67:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1403s, loss: 0.0259: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9220s, loss = 0.0259, accuracy: 100.0000%\n",
      "* Validation for epoch 67:\n",
      "-> Valid. time: 0.0214s, loss: 0.0201, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 67:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 68:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1392s, loss: 0.0259: 100%|██████████| 6/6 [00:00<00:00,  6.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9114s, loss = 0.0259, accuracy: 100.0000%\n",
      "* Validation for epoch 68:\n",
      "-> Valid. time: 0.0223s, loss: 0.0201, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 68:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 69:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0252: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9231s, loss = 0.0252, accuracy: 100.0000%\n",
      "* Validation for epoch 69:\n",
      "-> Valid. time: 0.0213s, loss: 0.0200, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 69:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 70:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1406s, loss: 0.0255: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9207s, loss = 0.0255, accuracy: 100.0000%\n",
      "* Validation for epoch 70:\n",
      "-> Valid. time: 0.0215s, loss: 0.0200, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 70:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 71:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1407s, loss: 0.0259: 100%|██████████| 6/6 [00:00<00:00,  6.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9214s, loss = 0.0259, accuracy: 100.0000%\n",
      "* Validation for epoch 71:\n",
      "-> Valid. time: 0.0217s, loss: 0.0200, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 71:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 72:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1388s, loss: 0.0275: 100%|██████████| 6/6 [00:00<00:00,  6.62it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9129s, loss = 0.0275, accuracy: 100.0000%\n",
      "* Validation for epoch 72:\n",
      "-> Valid. time: 0.0228s, loss: 0.0199, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 72:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 73:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1393s, loss: 0.0241: 100%|██████████| 6/6 [00:00<00:00,  6.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9130s, loss = 0.0241, accuracy: 100.0000%\n",
      "* Validation for epoch 73:\n",
      "-> Valid. time: 0.0247s, loss: 0.0199, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 73:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 74:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1393s, loss: 0.0251: 100%|██████████| 6/6 [00:00<00:00,  6.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9118s, loss = 0.0251, accuracy: 100.0000%\n",
      "* Validation for epoch 74:\n",
      "-> Valid. time: 0.0234s, loss: 0.0199, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 74:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 75:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1413s, loss: 0.0256: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9242s, loss = 0.0256, accuracy: 100.0000%\n",
      "* Validation for epoch 75:\n",
      "-> Valid. time: 0.0215s, loss: 0.0198, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 75:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 76:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1403s, loss: 0.0250: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9174s, loss = 0.0250, accuracy: 100.0000%\n",
      "* Validation for epoch 76:\n",
      "-> Valid. time: 0.0214s, loss: 0.0198, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 76:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 77:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1397s, loss: 0.0268: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9175s, loss = 0.0268, accuracy: 100.0000%\n",
      "* Validation for epoch 77:\n",
      "-> Valid. time: 0.0214s, loss: 0.0198, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 77:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 78:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1403s, loss: 0.0255: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9212s, loss = 0.0255, accuracy: 100.0000%\n",
      "* Validation for epoch 78:\n",
      "-> Valid. time: 0.0218s, loss: 0.0198, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 78:\n",
      "Test accuracy: 0.6826%\n",
      "\n",
      "* Training epoch 79:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1397s, loss: 0.0246: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9134s, loss = 0.0246, accuracy: 100.0000%\n",
      "* Validation for epoch 79:\n",
      "-> Valid. time: 0.0212s, loss: 0.0197, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 79:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 80:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0248: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9236s, loss = 0.0248, accuracy: 100.0000%\n",
      "* Validation for epoch 80:\n",
      "-> Valid. time: 0.0214s, loss: 0.0197, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 80:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 81:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0257: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9147s, loss = 0.0257, accuracy: 100.0000%\n",
      "* Validation for epoch 81:\n",
      "-> Valid. time: 0.0254s, loss: 0.0197, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 81:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 82:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1412s, loss: 0.0250: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9248s, loss = 0.0250, accuracy: 100.0000%\n",
      "* Validation for epoch 82:\n",
      "-> Valid. time: 0.0213s, loss: 0.0196, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 82:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 83:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1394s, loss: 0.0251: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9133s, loss = 0.0251, accuracy: 100.0000%\n",
      "* Validation for epoch 83:\n",
      "-> Valid. time: 0.0244s, loss: 0.0196, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 83:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 84:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1407s, loss: 0.0249: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9212s, loss = 0.0249, accuracy: 100.0000%\n",
      "* Validation for epoch 84:\n",
      "-> Valid. time: 0.0218s, loss: 0.0196, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 84:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 85:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1397s, loss: 0.0238: 100%|██████████| 6/6 [00:00<00:00,  6.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9134s, loss = 0.0238, accuracy: 100.0000%\n",
      "* Validation for epoch 85:\n",
      "-> Valid. time: 0.0225s, loss: 0.0195, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 85:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 86:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1407s, loss: 0.0243: 100%|██████████| 6/6 [00:00<00:00,  6.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9214s, loss = 0.0243, accuracy: 100.0000%\n",
      "* Validation for epoch 86:\n",
      "-> Valid. time: 0.0219s, loss: 0.0195, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 86:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 87:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1404s, loss: 0.0256: 100%|██████████| 6/6 [00:00<00:00,  6.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9192s, loss = 0.0256, accuracy: 100.0000%\n",
      "* Validation for epoch 87:\n",
      "-> Valid. time: 0.0219s, loss: 0.0195, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 87:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 88:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1405s, loss: 0.0253: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9234s, loss = 0.0253, accuracy: 100.0000%\n",
      "* Validation for epoch 88:\n",
      "-> Valid. time: 0.0221s, loss: 0.0195, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 88:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 89:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1404s, loss: 0.0236: 100%|██████████| 6/6 [00:00<00:00,  6.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9201s, loss = 0.0236, accuracy: 100.0000%\n",
      "* Validation for epoch 89:\n",
      "-> Valid. time: 0.0225s, loss: 0.0194, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 89:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 90:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.0252: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9163s, loss = 0.0252, accuracy: 100.0000%\n",
      "* Validation for epoch 90:\n",
      "-> Valid. time: 0.0212s, loss: 0.0194, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 90:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 91:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1409s, loss: 0.0230: 100%|██████████| 6/6 [00:00<00:00,  6.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9214s, loss = 0.0230, accuracy: 100.0000%\n",
      "* Validation for epoch 91:\n",
      "-> Valid. time: 0.0210s, loss: 0.0194, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 91:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 92:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1410s, loss: 0.0233: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9241s, loss = 0.0233, accuracy: 100.0000%\n",
      "* Validation for epoch 92:\n",
      "-> Valid. time: 0.0210s, loss: 0.0193, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 92:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 93:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1401s, loss: 0.0246: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9226s, loss = 0.0246, accuracy: 100.0000%\n",
      "* Validation for epoch 93:\n",
      "-> Valid. time: 0.0227s, loss: 0.0193, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 93:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 94:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1411s, loss: 0.0244: 100%|██████████| 6/6 [00:00<00:00,  6.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9252s, loss = 0.0244, accuracy: 100.0000%\n",
      "* Validation for epoch 94:\n",
      "-> Valid. time: 0.0221s, loss: 0.0193, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 94:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 95:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1403s, loss: 0.0248: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9174s, loss = 0.0248, accuracy: 100.0000%\n",
      "* Validation for epoch 95:\n",
      "-> Valid. time: 0.0220s, loss: 0.0192, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 95:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 96:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0240: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9174s, loss = 0.0240, accuracy: 100.0000%\n",
      "* Validation for epoch 96:\n",
      "-> Valid. time: 0.0214s, loss: 0.0192, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 96:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 97:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1389s, loss: 0.0256: 100%|██████████| 6/6 [00:00<00:00,  6.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9115s, loss = 0.0256, accuracy: 100.0000%\n",
      "* Validation for epoch 97:\n",
      "-> Valid. time: 0.0226s, loss: 0.0192, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 97:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 98:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1389s, loss: 0.0247: 100%|██████████| 6/6 [00:00<00:00,  6.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9147s, loss = 0.0247, accuracy: 100.0000%\n",
      "* Validation for epoch 98:\n",
      "-> Valid. time: 0.0242s, loss: 0.0191, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 98:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 99:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1398s, loss: 0.0244: 100%|██████████| 6/6 [00:00<00:00,  6.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9164s, loss = 0.0244, accuracy: 100.0000%\n",
      "* Validation for epoch 99:\n",
      "-> Valid. time: 0.0209s, loss: 0.0191, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 99:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "* Training epoch 100:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1401s, loss: 0.0239: 100%|██████████| 6/6 [00:00<00:00,  6.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9178s, loss = 0.0239, accuracy: 100.0000%\n",
      "* Validation for epoch 100:\n",
      "-> Valid. time: 0.0212s, loss: 0.0191, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 100:\n",
      "Test accuracy: 0.6831%\n",
      "\n",
      "Accuracy: 68.3%\n",
      "Precision: 73.2%\n",
      "Recall: 68.4%\n",
      "F1: 66.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.840     0.454     0.589       912\n",
      "     class_1      0.625     0.913     0.742       909\n",
      "\n",
      "    accuracy                          0.683      1821\n",
      "   macro avg      0.732     0.684     0.666      1821\n",
      "weighted avg      0.733     0.683     0.666      1821\n",
      "\n",
      "K: 400\n",
      "sim: 0.5\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-27-6b3e293aa7ac>:16: FutureWarning: The behavior of DataFrame concatenation with empty or all-NA entries is deprecated. In a future version, this will no longer exclude empty or all-NA columns when determining the result dtypes. To retain the old behavior, exclude the relevant entries before the concat operation.\n",
      "  max_k_results_df = pd.concat([max_k_results_df, pd.DataFrame({'K': K, 'acc': [acc], 'f1': [f1]})], ignore_index=True)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "sim: 0.75\n",
      "sim: 0.875\n",
      "sim: 0.8125\n",
      "sim: 0.84375\n",
      "sim: 0.5\n",
      "sim: 0.75\n",
      "sim: 0.875\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6635, accuracy: 65.0000%, auc: 0.6667\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1460s, loss: 0.3484: 100%|██████████| 23/23 [00:03<00:00,  6.32it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.6420s, loss = 0.3484, accuracy: 88.0556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1082s, loss: 0.0980, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5887%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1459s, loss: 0.0861: 100%|██████████| 23/23 [00:03<00:00,  6.32it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.6444s, loss = 0.0861, accuracy: 98.0556%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1160s, loss: 0.0311, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6925%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1491s, loss: 0.0293: 100%|██████████| 23/23 [00:03<00:00,  6.20it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7110s, loss = 0.0293, accuracy: 99.7222%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1127s, loss: 0.0366, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 69.2%\n",
      "Precision: 75.0%\n",
      "Recall: 69.3%\n",
      "F1: 67.4%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.871     0.453     0.596       912\n",
      "     class_1      0.630     0.933     0.752       909\n",
      "\n",
      "    accuracy                          0.692      1821\n",
      "   macro avg      0.750     0.693     0.674      1821\n",
      "weighted avg      0.751     0.692     0.674      1821\n",
      "\n",
      "K: 700\n",
      "sim: 0.5\n",
      "sim: 0.75\n",
      "sim: 0.875\n",
      "sim: 0.9375\n",
      "sim: 0.90625\n",
      "sim: 0.890625\n",
      "sim: 0.8828125\n",
      "sim: 0.5\n"
     ]
    }
   ],
   "source": [
    "pos_cos_sim = cosine_similarity(pos_syn_df['embedding'].tolist())\n",
    "neg_cos_sim = cosine_similarity(neg_syn_df['embedding'].tolist())\n",
    "\n",
    "max_k_results_df = pd.DataFrame(columns=['K', 'sim_thresh', 'acc', 'f1'])\n",
    "results_save_name = f\"max_k_results-{datestr}.csv\"\n",
    "\n",
    "for K in Ks:\n",
    "  print(f\"K: {K}\")\n",
    "  _, _, pos_selected_samples = calculate_similarity_threshold(pos_cos_sim, K//2, 0.9)\n",
    "  _, _, neg_selected_samples = calculate_similarity_threshold(neg_cos_sim, K//2, 0.9)\n",
    "\n",
    "  sel_data_df = pd.concat([pos_syn_df.iloc[pos_selected_samples], neg_syn_df.iloc[neg_selected_samples]])\n",
    "\n",
    "  for i in range(NUM_REPS):\n",
    "    acc, f1 = train_model_max_cover(sel_data_df, test_df, target_dir)\n",
    "    max_k_results_df = pd.concat([max_k_results_df, pd.DataFrame({'K': K, 'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
    "  max_k_results_df.to_csv(os.path.join(target_dir, results_save_name))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "2ionoHMu6OHk"
   },
   "source": [
    "### Train model on random k samples"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000,
     "referenced_widgets": [
      "3711473f681a489297a32650a74fa2c2",
      "ff33a45708ae4331beb0a037de6e42bb",
      "6525bad8ac6743f0ae5bc7fa4b6842f3",
      "ef73adeea2034e36b82a721bde5fe6ed",
      "a305e6d37d4d48028dd90f4eb5f8f2b1",
      "0c72b6cbae2a4a5088f6f750f657ba72",
      "1f32563781234251ab589618c62441ee",
      "4576e26b03794806a18db8960f77f3ea",
      "996ecf66ca0a4080b03f5fe08a3799c5",
      "b25d0ebb00ce4d2aa4840169353e6e6b",
      "15880d1eafff4e8885ec11fc66eb20ec",
      "9260c4eced3f4053bbe3e553b6c54978",
      "5a119b8b191d42879f23a320a5002ce4",
      "129e20221232419bbc3533cbab76fa93",
      "1991f4cbf9d5438e83fad021c2677972",
      "44f88c1a61f146ee9ba2d85c98286d5c",
      "714320b450f44064994d2d797ecf3a77",
      "582cc43ffa344802b78bbf47c7dcfb6f",
      "663506a165b1427796274d381d366123",
      "b02bd446fd2d48ad8951ccfa02a59cf8",
      "a53848f15e4a4ac5ae6cb2deb30f1da5",
      "2a98e22cdc8b4b338aeccf00c76500e1",
      "0826f510218b466eb1845043abcc4130",
      "516971a7b62b4945a6fa34e65d099f69",
      "2473829b9c2742b9b7c2e093a930bcdf",
      "7257ed6000954b09b13c63c136715882",
      "81b9b9bece6a4337a7cf8e6b9017feec",
      "90fc6dcd85f84a3ea7a65d561f9a868e",
      "316d53715c7d4c179c41422ece261a2b",
      "9d9c9ab3a1ad4e58addb885271776867",
      "9bac258e5421495298ec04d03c9cfc47",
      "ace708058b7946c680e4ea72a992269c",
      "8fda0d670095475cbfb0e0476365904b",
      "09f10b2958e842f3ab7e18035efdf75d",
      "d95cc2c3c9a443afbc9a8ca768fc8007",
      "af3da40cc65649c89236a8a37a2eb3ea",
      "1a67f5ffeb9746a3a37883dec437e968",
      "57e6bc8f31b84afa92732ea307d3942f",
      "0d1e360d2139470c807f04fc1b46f221",
      "5f5833d9c53b4d43b40ef63b2824704e",
      "90606f8bed0146adb43a136f0ea72b17",
      "80a1bd7652e74a4e95557db515e2adce",
      "309413fde8764de2b13567284e472aa4",
      "7828c2d9620d47d982c83d7f826325d8",
      "e36d0c0249674223af00ab11b891dba1",
      "72dd61e0324a4d64b7701473712b1ef2",
      "b13e0504180649828cd2924f8c56a58a",
      "bc166cef93ec4221882275fcf3b9ac6b",
      "bcec675da8d54fdbb8b215b2bc309e2b",
      "ae9a1b61dfd64d2dae92f6a671ec1763",
      "63f42b7ff026482a93efac91478215e4",
      "5ef28d4b85c446698225f093d90f1bac",
      "02edcbf7bbc249a29ad244b0428531a8",
      "9e64068e1aed4268971e33425aebb79a",
      "e2344bcd967a46c98edcb30d83b736c7"
     ]
    },
    "executionInfo": {
     "elapsed": 2509922,
     "status": "ok",
     "timestamp": 1726507711273,
     "user": {
      "displayName": "Max Springer",
      "userId": "10242344097673962660"
     },
     "user_tz": 240
    },
    "id": "7wbyHUhy6QJZ",
    "outputId": "2a58301d-fe00-445a-a5d4-f61d4ac980a7"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "100\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "3711473f681a489297a32650a74fa2c2",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "config.json:   0%|          | 0.00/570 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "9260c4eced3f4053bbe3e553b6c54978",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "model.safetensors:   0%|          | 0.00/440M [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "0826f510218b466eb1845043abcc4130",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "09f10b2958e842f3ab7e18035efdf75d",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e36d0c0249674223af00ab11b891dba1",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7242, accuracy: 50.0000%, auc: 0.6875\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.2274s, loss: 0.6453: 100%|██████████| 6/6 [00:01<00:00,  4.20it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.4328s, loss = 0.6453, accuracy: 61.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0208s, loss: 0.4897, accuracy: 90.0000%, auc: 0.9375\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5409%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1320s, loss: 0.4405: 100%|██████████| 6/6 [00:00<00:00,  6.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8644s, loss = 0.4405, accuracy: 90.0000%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0214s, loss: 0.3504, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5678%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1334s, loss: 0.2754: 100%|██████████| 6/6 [00:00<00:00,  6.87it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8771s, loss = 0.2754, accuracy: 95.5556%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0205s, loss: 0.2194, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6216%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1333s, loss: 0.1527: 100%|██████████| 6/6 [00:00<00:00,  6.89it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8737s, loss = 0.1527, accuracy: 98.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0199s, loss: 0.1584, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6266%\n",
      "\n",
      "Accuracy: 62.7%\n",
      "Precision: 62.7%\n",
      "Recall: 62.7%\n",
      "F1: 62.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.617     0.669     0.642       912\n",
      "     class_1      0.637     0.584     0.610       909\n",
      "\n",
      "    accuracy                          0.627      1821\n",
      "   macro avg      0.627     0.627     0.626      1821\n",
      "weighted avg      0.627     0.627     0.626      1821\n",
      "\n",
      "100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-17-0394ae4329a4>:13: FutureWarning: The behavior of DataFrame concatenation with empty or all-NA entries is deprecated. In a future version, this will no longer exclude empty or all-NA columns when determining the result dtypes. To retain the old behavior, exclude the relevant entries before the concat operation.\n",
      "  rand_k_results_df = pd.concat([rand_k_results_df, pd.DataFrame({'K': K, 'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6603, accuracy: 80.0000%, auc: 0.1250\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1368s, loss: 0.6206: 100%|██████████| 6/6 [00:00<00:00,  6.76it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8925s, loss = 0.6206, accuracy: 71.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0225s, loss: 0.5273, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5629%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1356s, loss: 0.4240: 100%|██████████| 6/6 [00:00<00:00,  6.78it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8880s, loss = 0.4240, accuracy: 94.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0227s, loss: 0.3200, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5761%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1362s, loss: 0.2881: 100%|██████████| 6/6 [00:00<00:00,  6.76it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8918s, loss = 0.2881, accuracy: 95.5556%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0229s, loss: 0.2482, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6129%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1362s, loss: 0.1603: 100%|██████████| 6/6 [00:00<00:00,  6.76it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.8915s, loss = 0.1603, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0212s, loss: 0.1351, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6205%\n",
      "\n",
      "Accuracy: 62.1%\n",
      "Precision: 63.0%\n",
      "Recall: 62.0%\n",
      "F1: 61.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.595     0.759     0.667       912\n",
      "     class_1      0.666     0.482     0.559       909\n",
      "\n",
      "    accuracy                          0.621      1821\n",
      "   macro avg      0.630     0.620     0.613      1821\n",
      "weighted avg      0.630     0.621     0.613      1821\n",
      "\n",
      "100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.7788, accuracy: 20.0000%, auc: 0.3125\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1416s, loss: 0.5860: 100%|██████████| 6/6 [00:00<00:00,  6.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9308s, loss = 0.5860, accuracy: 72.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0208s, loss: 0.5359, accuracy: 70.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5239%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1384s, loss: 0.4028: 100%|██████████| 6/6 [00:00<00:00,  6.64it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9080s, loss = 0.4028, accuracy: 92.2222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0214s, loss: 0.3340, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5634%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1392s, loss: 0.2650: 100%|██████████| 6/6 [00:00<00:00,  6.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9100s, loss = 0.2650, accuracy: 98.8889%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0211s, loss: 0.2084, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6024%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1372s, loss: 0.1578: 100%|██████████| 6/6 [00:00<00:00,  6.69it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9008s, loss = 0.1578, accuracy: 98.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0244s, loss: 0.1231, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.5980%\n",
      "\n",
      "Accuracy: 59.8%\n",
      "Precision: 62.0%\n",
      "Recall: 59.8%\n",
      "F1: 57.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.569     0.815     0.670       912\n",
      "     class_1      0.672     0.381     0.486       909\n",
      "\n",
      "    accuracy                          0.598      1821\n",
      "   macro avg      0.620     0.598     0.578      1821\n",
      "weighted avg      0.620     0.598     0.578      1821\n",
      "\n",
      "100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.8020, accuracy: 20.0000%, auc: 0.7500\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1438s, loss: 0.5452: 100%|██████████| 6/6 [00:00<00:00,  6.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9370s, loss = 0.5452, accuracy: 74.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0215s, loss: 0.6210, accuracy: 60.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5157%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1416s, loss: 0.4704: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9278s, loss = 0.4704, accuracy: 77.7778%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0232s, loss: 0.2648, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5744%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1415s, loss: 0.3151: 100%|██████████| 6/6 [00:00<00:00,  6.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9261s, loss = 0.3151, accuracy: 91.1111%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0236s, loss: 0.2049, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6019%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1399s, loss: 0.2018: 100%|██████████| 6/6 [00:00<00:00,  6.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9175s, loss = 0.2018, accuracy: 97.7778%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0252s, loss: 0.2729, accuracy: 90.0000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 60.2%\n",
      "Precision: 61.2%\n",
      "Recall: 60.2%\n",
      "F1: 59.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.579     0.752     0.654       912\n",
      "     class_1      0.645     0.451     0.531       909\n",
      "\n",
      "    accuracy                          0.602      1821\n",
      "   macro avg      0.612     0.602     0.593      1821\n",
      "weighted avg      0.612     0.602     0.593      1821\n",
      "\n",
      "100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.6343, accuracy: 80.0000%, auc: 0.6250\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1461s, loss: 0.6483: 100%|██████████| 6/6 [00:00<00:00,  6.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9484s, loss = 0.6483, accuracy: 67.7778%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0237s, loss: 0.5361, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5832%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1444s, loss: 0.4540: 100%|██████████| 6/6 [00:00<00:00,  6.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9464s, loss = 0.4540, accuracy: 90.0000%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0240s, loss: 0.3620, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6348%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1445s, loss: 0.2670: 100%|██████████| 6/6 [00:00<00:00,  6.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9457s, loss = 0.2670, accuracy: 96.6667%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0234s, loss: 0.2171, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6678%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1447s, loss: 0.1507: 100%|██████████| 6/6 [00:00<00:00,  6.37it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 0.9445s, loss = 0.1507, accuracy: 98.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0226s, loss: 0.1585, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6694%\n",
      "\n",
      "Accuracy: 66.9%\n",
      "Precision: 67.1%\n",
      "Recall: 66.9%\n",
      "F1: 66.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.688     0.623     0.654       912\n",
      "     class_1      0.654     0.716     0.684       909\n",
      "\n",
      "    accuracy                          0.669      1821\n",
      "   macro avg      0.671     0.669     0.669      1821\n",
      "weighted avg      0.671     0.669     0.669      1821\n",
      "\n",
      "200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.6930, accuracy: 60.0000%, auc: 0.3737\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1480s, loss: 0.5554: 100%|██████████| 12/12 [00:01<00:00,  6.27it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9186s, loss = 0.5554, accuracy: 73.8889%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0539s, loss: 0.2939, accuracy: 95.0000%, auc: 0.9899\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5338%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1459s, loss: 0.2817: 100%|██████████| 12/12 [00:01<00:00,  6.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.8996s, loss = 0.2817, accuracy: 96.6667%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0518s, loss: 0.0902, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5826%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1475s, loss: 0.0930: 100%|██████████| 12/12 [00:01<00:00,  6.27it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9193s, loss = 0.0930, accuracy: 98.8889%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0524s, loss: 0.0367, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.5986%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1475s, loss: 0.0551: 100%|██████████| 12/12 [00:01<00:00,  6.27it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9183s, loss = 0.0551, accuracy: 98.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0552s, loss: 0.0191, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6123%\n",
      "\n",
      "Accuracy: 61.2%\n",
      "Precision: 62.0%\n",
      "Recall: 61.3%\n",
      "F1: 60.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.649     0.491     0.559       912\n",
      "     class_1      0.590     0.734     0.654       909\n",
      "\n",
      "    accuracy                          0.612      1821\n",
      "   macro avg      0.620     0.613     0.607      1821\n",
      "weighted avg      0.620     0.612     0.607      1821\n",
      "\n",
      "200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.6921, accuracy: 55.0000%, auc: 0.7374\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1481s, loss: 0.5912: 100%|██████████| 12/12 [00:01<00:00,  6.26it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9210s, loss = 0.5912, accuracy: 70.5556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0526s, loss: 0.3137, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5728%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1478s, loss: 0.2435: 100%|██████████| 12/12 [00:01<00:00,  6.24it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9282s, loss = 0.2435, accuracy: 97.2222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0500s, loss: 0.0904, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6919%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1469s, loss: 0.0781: 100%|██████████| 12/12 [00:01<00:00,  6.29it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9096s, loss = 0.0781, accuracy: 99.4444%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0512s, loss: 0.0430, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7188%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1470s, loss: 0.0312: 100%|██████████| 12/12 [00:01<00:00,  6.29it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9113s, loss = 0.0312, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0517s, loss: 0.0173, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7287%\n",
      "\n",
      "Accuracy: 72.9%\n",
      "Precision: 72.9%\n",
      "Recall: 72.9%\n",
      "F1: 72.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.736     0.714     0.725       912\n",
      "     class_1      0.721     0.744     0.732       909\n",
      "\n",
      "    accuracy                          0.729      1821\n",
      "   macro avg      0.729     0.729     0.729      1821\n",
      "weighted avg      0.729     0.729     0.729      1821\n",
      "\n",
      "200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.8238, accuracy: 35.0000%, auc: 0.4040\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1488s, loss: 0.5146: 100%|██████████| 12/12 [00:01<00:00,  6.22it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9321s, loss = 0.5146, accuracy: 73.8889%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0515s, loss: 0.3393, accuracy: 85.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5513%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1476s, loss: 0.2444: 100%|██████████| 12/12 [00:01<00:00,  6.27it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9187s, loss = 0.2444, accuracy: 95.5556%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0526s, loss: 0.2526, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6150%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1478s, loss: 0.1061: 100%|██████████| 12/12 [00:01<00:00,  6.26it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9197s, loss = 0.1061, accuracy: 98.3333%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0516s, loss: 0.0547, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6420%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1470s, loss: 0.0579: 100%|██████████| 12/12 [00:01<00:00,  6.29it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9136s, loss = 0.0579, accuracy: 99.4444%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0504s, loss: 0.0290, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6507%\n",
      "\n",
      "Accuracy: 65.1%\n",
      "Precision: 65.2%\n",
      "Recall: 65.1%\n",
      "F1: 65.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.638     0.700     0.667       912\n",
      "     class_1      0.666     0.602     0.632       909\n",
      "\n",
      "    accuracy                          0.651      1821\n",
      "   macro avg      0.652     0.651     0.650      1821\n",
      "weighted avg      0.652     0.651     0.650      1821\n",
      "\n",
      "200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.7316, accuracy: 35.0000%, auc: 0.1818\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1491s, loss: 0.6247: 100%|██████████| 12/12 [00:01<00:00,  6.21it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9347s, loss = 0.6247, accuracy: 65.5556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0532s, loss: 0.4359, accuracy: 95.0000%, auc: 0.9899\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5453%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1470s, loss: 0.3380: 100%|██████████| 12/12 [00:01<00:00,  6.29it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9132s, loss = 0.3380, accuracy: 94.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0515s, loss: 0.1694, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5722%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1476s, loss: 0.1598: 100%|██████████| 12/12 [00:01<00:00,  6.27it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9178s, loss = 0.1598, accuracy: 97.2222%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0498s, loss: 0.1714, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 57.2%\n",
      "Precision: 57.3%\n",
      "Recall: 57.2%\n",
      "F1: 57.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.566     0.627     0.595       912\n",
      "     class_1      0.580     0.517     0.547       909\n",
      "\n",
      "    accuracy                          0.572      1821\n",
      "   macro avg      0.573     0.572     0.571      1821\n",
      "weighted avg      0.573     0.572     0.571      1821\n",
      "\n",
      "200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\t* Building model...\n",
      "\n",
      "* Validation loss before training: 0.6872, accuracy: 50.0000%, auc: 0.4747\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1484s, loss: 0.5322: 100%|██████████| 12/12 [00:01<00:00,  6.25it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9255s, loss = 0.5322, accuracy: 73.3333%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0501s, loss: 0.3012, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5832%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1474s, loss: 0.2353: 100%|██████████| 12/12 [00:01<00:00,  6.28it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9151s, loss = 0.2353, accuracy: 95.0000%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0525s, loss: 0.1376, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6733%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1468s, loss: 0.1159: 100%|██████████| 12/12 [00:01<00:00,  6.30it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 1.9087s, loss = 0.1159, accuracy: 97.7778%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0524s, loss: 0.0822, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 67.3%\n",
      "Precision: 67.3%\n",
      "Recall: 67.3%\n",
      "F1: 67.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.668     0.690     0.679       912\n",
      "     class_1      0.678     0.657     0.667       909\n",
      "\n",
      "    accuracy                          0.673      1821\n",
      "   macro avg      0.673     0.673     0.673      1821\n",
      "weighted avg      0.673     0.673     0.673      1821\n",
      "\n",
      "300\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7126, accuracy: 53.3333%, auc: 0.7054\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.4503: 100%|██████████| 17/17 [00:02<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8488s, loss = 0.4503, accuracy: 81.4815%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0811s, loss: 0.2120, accuracy: 96.6667%, auc: 0.9955\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6107%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.1400: 100%|██████████| 17/17 [00:02<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8372s, loss = 0.1400, accuracy: 98.1481%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0839s, loss: 0.1217, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7183%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1536s, loss: 0.0584: 100%|██████████| 17/17 [00:02<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8234s, loss = 0.0584, accuracy: 99.2593%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0813s, loss: 0.0254, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7721%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.0368: 100%|██████████| 17/17 [00:02<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8367s, loss = 0.0368, accuracy: 99.2593%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0816s, loss: 0.1179, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 77.2%\n",
      "Precision: 78.5%\n",
      "Recall: 77.2%\n",
      "F1: 77.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.845     0.668     0.746       912\n",
      "     class_1      0.725     0.877     0.793       909\n",
      "\n",
      "    accuracy                          0.772      1821\n",
      "   macro avg      0.785     0.772     0.770      1821\n",
      "weighted avg      0.785     0.772     0.770      1821\n",
      "\n",
      "300\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7485, accuracy: 36.6667%, auc: 0.3571\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1560s, loss: 0.4296: 100%|██████████| 17/17 [00:02<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8582s, loss = 0.4296, accuracy: 82.9630%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0838s, loss: 0.2001, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5184%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.1421: 100%|██████████| 17/17 [00:02<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8248s, loss = 0.1421, accuracy: 97.7778%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0819s, loss: 0.0805, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6238%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.0556: 100%|██████████| 17/17 [00:02<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8262s, loss = 0.0556, accuracy: 99.6296%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0839s, loss: 0.0334, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6859%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1545s, loss: 0.0285: 100%|██████████| 17/17 [00:02<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8378s, loss = 0.0285, accuracy: 99.6296%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0804s, loss: 0.0952, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 68.6%\n",
      "Precision: 71.1%\n",
      "Recall: 68.6%\n",
      "F1: 67.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.638     0.860     0.733       912\n",
      "     class_1      0.784     0.512     0.619       909\n",
      "\n",
      "    accuracy                          0.686      1821\n",
      "   macro avg      0.711     0.686     0.676      1821\n",
      "weighted avg      0.711     0.686     0.676      1821\n",
      "\n",
      "300\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6796, accuracy: 66.6667%, auc: 0.6652\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1557s, loss: 0.5074: 100%|██████████| 17/17 [00:02<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8552s, loss = 0.5074, accuracy: 80.0000%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0818s, loss: 0.2448, accuracy: 96.6667%, auc: 0.9955\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5936%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.1701: 100%|██████████| 17/17 [00:02<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8256s, loss = 0.1701, accuracy: 96.6667%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0839s, loss: 0.0986, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6787%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.0423: 100%|██████████| 17/17 [00:02<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8316s, loss = 0.0423, accuracy: 99.6296%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0801s, loss: 0.0887, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7342%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.0160: 100%|██████████| 17/17 [00:02<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8328s, loss = 0.0160, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0809s, loss: 0.0793, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7232%\n",
      "\n",
      "Accuracy: 72.3%\n",
      "Precision: 73.6%\n",
      "Recall: 72.3%\n",
      "F1: 72.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.791     0.607     0.687       912\n",
      "     class_1      0.681     0.839     0.752       909\n",
      "\n",
      "    accuracy                          0.723      1821\n",
      "   macro avg      0.736     0.723     0.720      1821\n",
      "weighted avg      0.736     0.723     0.719      1821\n",
      "\n",
      "300\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8146, accuracy: 33.3333%, auc: 0.2768\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.5032: 100%|██████████| 17/17 [00:02<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8478s, loss = 0.5032, accuracy: 77.4074%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0799s, loss: 0.2123, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5272%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.2056: 100%|██████████| 17/17 [00:02<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8223s, loss = 0.2056, accuracy: 95.5556%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0834s, loss: 0.1287, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5393%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.0726: 100%|██████████| 17/17 [00:02<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8458s, loss = 0.0726, accuracy: 99.2593%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0831s, loss: 0.0386, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6403%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0430: 100%|██████████| 17/17 [00:02<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8521s, loss = 0.0430, accuracy: 99.6296%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0817s, loss: 0.0253, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6227%\n",
      "\n",
      "Accuracy: 62.3%\n",
      "Precision: 68.7%\n",
      "Recall: 62.2%\n",
      "F1: 58.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.578     0.916     0.709       912\n",
      "     class_1      0.795     0.329     0.465       909\n",
      "\n",
      "    accuracy                          0.623      1821\n",
      "   macro avg      0.687     0.622     0.587      1821\n",
      "weighted avg      0.686     0.623     0.587      1821\n",
      "\n",
      "300\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6988, accuracy: 50.0000%, auc: 0.5089\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.5424: 100%|██████████| 17/17 [00:02<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8389s, loss = 0.5424, accuracy: 78.5185%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.0831s, loss: 0.2450, accuracy: 93.3333%, auc: 0.9955\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5524%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.1799: 100%|██████████| 17/17 [00:02<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8267s, loss = 0.1799, accuracy: 96.2963%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.0836s, loss: 0.0945, accuracy: 96.6667%, auc: 0.9955\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6189%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1537s, loss: 0.0451: 100%|██████████| 17/17 [00:02<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8261s, loss = 0.0451, accuracy: 99.6296%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.0760s, loss: 0.0958, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6546%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.0338: 100%|██████████| 17/17 [00:02<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 2.8193s, loss = 0.0338, accuracy: 99.2593%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.0824s, loss: 0.0679, accuracy: 96.6667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6650%\n",
      "\n",
      "Accuracy: 66.5%\n",
      "Precision: 72.0%\n",
      "Recall: 66.5%\n",
      "F1: 64.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.610     0.916     0.732       912\n",
      "     class_1      0.830     0.414     0.552       909\n",
      "\n",
      "    accuracy                          0.665      1821\n",
      "   macro avg      0.720     0.665     0.642      1821\n",
      "weighted avg      0.720     0.665     0.642      1821\n",
      "\n",
      "400\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6517, accuracy: 55.0000%, auc: 0.7045\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1530s, loss: 0.3942: 100%|██████████| 23/23 [00:03<00:00,  6.07it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7943s, loss = 0.3942, accuracy: 88.0556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1233s, loss: 0.1121, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6573%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1530s, loss: 0.0857: 100%|██████████| 23/23 [00:03<00:00,  6.05it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8034s, loss = 0.0857, accuracy: 98.0556%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1202s, loss: 0.0361, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7287%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1528s, loss: 0.0173: 100%|██████████| 23/23 [00:03<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8129s, loss = 0.0173, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1205s, loss: 0.0096, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6145%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1518s, loss: 0.0110: 100%|██████████| 23/23 [00:03<00:00,  6.11it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7704s, loss = 0.0110, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1199s, loss: 0.0058, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6502%\n",
      "\n",
      "Accuracy: 65.0%\n",
      "Precision: 73.0%\n",
      "Recall: 65.1%\n",
      "F1: 61.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.867     0.356     0.505       912\n",
      "     class_1      0.594     0.945     0.730       909\n",
      "\n",
      "    accuracy                          0.650      1821\n",
      "   macro avg      0.730     0.651     0.617      1821\n",
      "weighted avg      0.731     0.650     0.617      1821\n",
      "\n",
      "400\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6761, accuracy: 50.0000%, auc: 0.8182\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1527s, loss: 0.3927: 100%|██████████| 23/23 [00:03<00:00,  6.07it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7928s, loss = 0.3927, accuracy: 85.5556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1186s, loss: 0.1559, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6771%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1526s, loss: 0.0979: 100%|██████████| 23/23 [00:03<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7989s, loss = 0.0979, accuracy: 98.3333%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1251s, loss: 0.0487, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7622%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.0243: 100%|██████████| 23/23 [00:03<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8104s, loss = 0.0243, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1262s, loss: 0.0497, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7748%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1530s, loss: 0.0143: 100%|██████████| 23/23 [00:03<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8001s, loss = 0.0143, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1229s, loss: 0.0060, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6496%\n",
      "\n",
      "Accuracy: 65.0%\n",
      "Precision: 75.7%\n",
      "Recall: 65.0%\n",
      "F1: 60.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.923     0.328     0.484       912\n",
      "     class_1      0.591     0.972     0.735       909\n",
      "\n",
      "    accuracy                          0.650      1821\n",
      "   macro avg      0.757     0.650     0.609      1821\n",
      "weighted avg      0.757     0.650     0.609      1821\n",
      "\n",
      "400\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7129, accuracy: 37.5000%, auc: 0.4268\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.4366: 100%|██████████| 23/23 [00:03<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8187s, loss = 0.4366, accuracy: 84.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1252s, loss: 0.1498, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6348%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1522s, loss: 0.1177: 100%|██████████| 23/23 [00:03<00:00,  6.08it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7839s, loss = 0.1177, accuracy: 98.3333%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1192s, loss: 0.0302, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6864%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1525s, loss: 0.0237: 100%|██████████| 23/23 [00:03<00:00,  6.07it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7945s, loss = 0.0237, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1224s, loss: 0.0113, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7090%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1532s, loss: 0.0111: 100%|██████████| 23/23 [00:03<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7997s, loss = 0.0111, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1172s, loss: 0.0065, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7232%\n",
      "\n",
      "Accuracy: 72.3%\n",
      "Precision: 72.4%\n",
      "Recall: 72.3%\n",
      "F1: 72.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.709     0.759     0.733       912\n",
      "     class_1      0.740     0.688     0.713       909\n",
      "\n",
      "    accuracy                          0.723      1821\n",
      "   macro avg      0.724     0.723     0.723      1821\n",
      "weighted avg      0.724     0.723     0.723      1821\n",
      "\n",
      "400\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8147, accuracy: 42.5000%, auc: 0.5101\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.3417: 100%|██████████| 23/23 [00:03<00:00,  6.05it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8039s, loss = 0.3417, accuracy: 86.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1237s, loss: 0.1170, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6535%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1524s, loss: 0.0666: 100%|██████████| 23/23 [00:03<00:00,  6.08it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7886s, loss = 0.0666, accuracy: 99.1667%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1226s, loss: 0.0219, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7699%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.0188: 100%|██████████| 23/23 [00:03<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8158s, loss = 0.0188, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1212s, loss: 0.0297, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7853%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1524s, loss: 0.0210: 100%|██████████| 23/23 [00:03<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7964s, loss = 0.0210, accuracy: 99.7222%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1211s, loss: 0.0111, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7716%\n",
      "\n",
      "Accuracy: 77.2%\n",
      "Precision: 77.2%\n",
      "Recall: 77.2%\n",
      "F1: 77.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.788     0.745     0.766       912\n",
      "     class_1      0.757     0.799     0.777       909\n",
      "\n",
      "    accuracy                          0.772      1821\n",
      "   macro avg      0.772     0.772     0.771      1821\n",
      "weighted avg      0.772     0.772     0.771      1821\n",
      "\n",
      "400\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6427, accuracy: 62.5000%, auc: 0.6717\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.3821: 100%|██████████| 23/23 [00:03<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8250s, loss = 0.3821, accuracy: 87.5000%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1196s, loss: 0.1952, accuracy: 97.5000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6359%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1529s, loss: 0.1157: 100%|██████████| 23/23 [00:03<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.7991s, loss = 0.1157, accuracy: 97.5000%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1216s, loss: 0.0399, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6425%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1530s, loss: 0.0537: 100%|██████████| 23/23 [00:03<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 3.8148s, loss = 0.0537, accuracy: 99.4444%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1240s, loss: 0.1448, accuracy: 95.0000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 64.3%\n",
      "Precision: 71.6%\n",
      "Recall: 64.3%\n",
      "F1: 61.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.843     0.352     0.497       912\n",
      "     class_1      0.590     0.934     0.723       909\n",
      "\n",
      "    accuracy                          0.643      1821\n",
      "   macro avg      0.716     0.643     0.610      1821\n",
      "weighted avg      0.716     0.643     0.610      1821\n",
      "\n",
      "500\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7909, accuracy: 46.0000%, auc: 0.3344\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1530s, loss: 0.3629: 100%|██████████| 29/29 [00:04<00:00,  6.05it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7954s, loss = 0.3629, accuracy: 87.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1571s, loss: 0.4589, accuracy: 98.0000%, auc: 0.9872\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6090%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1515s, loss: 0.0798: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7575s, loss = 0.0798, accuracy: 98.2222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1632s, loss: 0.0685, accuracy: 98.0000%, auc: 0.9984\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6518%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1513s, loss: 0.0355: 100%|██████████| 29/29 [00:04<00:00,  6.12it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7473s, loss = 0.0355, accuracy: 99.3333%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1611s, loss: 0.0558, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7232%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1510s, loss: 0.0103: 100%|██████████| 29/29 [00:04<00:00,  6.12it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7414s, loss = 0.0103, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1568s, loss: 0.0641, accuracy: 98.0000%, auc: 0.9984\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7287%\n",
      "\n",
      "Accuracy: 72.9%\n",
      "Precision: 73.2%\n",
      "Recall: 72.9%\n",
      "F1: 72.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.704     0.791     0.745       912\n",
      "     class_1      0.760     0.667     0.710       909\n",
      "\n",
      "    accuracy                          0.729      1821\n",
      "   macro avg      0.732     0.729     0.728      1821\n",
      "weighted avg      0.732     0.729     0.728      1821\n",
      "\n",
      "500\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7116, accuracy: 54.0000%, auc: 0.6720\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1523s, loss: 0.3284: 100%|██████████| 29/29 [00:04<00:00,  6.08it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7742s, loss = 0.3284, accuracy: 88.6667%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1565s, loss: 0.1633, accuracy: 94.0000%, auc: 0.9936\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6431%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1519s, loss: 0.0507: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7608s, loss = 0.0507, accuracy: 99.1111%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1618s, loss: 0.1241, accuracy: 96.0000%, auc: 0.9968\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6870%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1519s, loss: 0.0319: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7597s, loss = 0.0319, accuracy: 99.1111%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1586s, loss: 0.1794, accuracy: 96.0000%, auc: 0.9968\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6337%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1516s, loss: 0.0254: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7630s, loss = 0.0254, accuracy: 99.1111%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1575s, loss: 0.0705, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7188%\n",
      "\n",
      "Accuracy: 71.9%\n",
      "Precision: 74.0%\n",
      "Recall: 71.9%\n",
      "F1: 71.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.812     0.571     0.671       912\n",
      "     class_1      0.668     0.867     0.755       909\n",
      "\n",
      "    accuracy                          0.719      1821\n",
      "   macro avg      0.740     0.719     0.713      1821\n",
      "weighted avg      0.740     0.719     0.713      1821\n",
      "\n",
      "500\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7238, accuracy: 36.0000%, auc: 0.3200\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1527s, loss: 0.4085: 100%|██████████| 29/29 [00:04<00:00,  6.07it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7843s, loss = 0.4085, accuracy: 86.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1550s, loss: 0.3499, accuracy: 92.0000%, auc: 0.9904\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5541%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1517s, loss: 0.0808: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7551s, loss = 0.0808, accuracy: 98.2222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1558s, loss: 0.0923, accuracy: 96.0000%, auc: 0.9936\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6348%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1519s, loss: 0.0210: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7579s, loss = 0.0210, accuracy: 99.7778%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1581s, loss: 0.0919, accuracy: 96.0000%, auc: 0.9984\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6518%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1528s, loss: 0.0188: 100%|██████████| 29/29 [00:04<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7888s, loss = 0.0188, accuracy: 99.5556%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1035s, loss: 0.0414, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "Accuracy: 68.4%\n",
      "Precision: 68.5%\n",
      "Recall: 68.4%\n",
      "F1: 68.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.668     0.731     0.698       912\n",
      "     class_1      0.702     0.636     0.667       909\n",
      "\n",
      "    accuracy                          0.684      1821\n",
      "   macro avg      0.685     0.684     0.683      1821\n",
      "weighted avg      0.685     0.684     0.683      1821\n",
      "\n",
      "500\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7010, accuracy: 46.0000%, auc: 0.4560\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1523s, loss: 0.3123: 100%|██████████| 29/29 [00:04<00:00,  6.08it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7733s, loss = 0.3123, accuracy: 91.5556%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1523s, loss: 0.1137, accuracy: 98.0000%, auc: 0.9968\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7128%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1515s, loss: 0.0514: 100%|██████████| 29/29 [00:04<00:00,  6.11it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7473s, loss = 0.0514, accuracy: 99.3333%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1528s, loss: 0.0506, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7397%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1517s, loss: 0.0174: 100%|██████████| 29/29 [00:04<00:00,  6.11it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7532s, loss = 0.0174, accuracy: 99.5556%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1558s, loss: 0.0157, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7287%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1520s, loss: 0.0059: 100%|██████████| 29/29 [00:04<00:00,  6.09it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7669s, loss = 0.0059, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1542s, loss: 0.0089, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7117%\n",
      "\n",
      "Accuracy: 71.2%\n",
      "Precision: 72.5%\n",
      "Recall: 71.1%\n",
      "F1: 70.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.671     0.832     0.743       912\n",
      "     class_1      0.778     0.591     0.672       909\n",
      "\n",
      "    accuracy                          0.712      1821\n",
      "   macro avg      0.725     0.711     0.707      1821\n",
      "weighted avg      0.725     0.712     0.707      1821\n",
      "\n",
      "500\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7112, accuracy: 50.0000%, auc: 0.3344\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1532s, loss: 0.3896: 100%|██████████| 29/29 [00:04<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7914s, loss = 0.3896, accuracy: 89.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1545s, loss: 0.2353, accuracy: 94.0000%, auc: 0.9856\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6705%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1523s, loss: 0.0773: 100%|██████████| 29/29 [00:04<00:00,  6.08it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7741s, loss = 0.0773, accuracy: 98.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1598s, loss: 0.0730, accuracy: 98.0000%, auc: 0.9968\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7194%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1519s, loss: 0.0223: 100%|██████████| 29/29 [00:04<00:00,  6.10it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7572s, loss = 0.0223, accuracy: 99.5556%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1516s, loss: 0.0103, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6930%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1518s, loss: 0.0112: 100%|██████████| 29/29 [00:04<00:00,  6.09it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 4.7679s, loss = 0.0112, accuracy: 99.7778%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1560s, loss: 0.0045, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7518%\n",
      "\n",
      "Accuracy: 75.2%\n",
      "Precision: 76.8%\n",
      "Recall: 75.2%\n",
      "F1: 74.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.833     0.630     0.718       912\n",
      "     class_1      0.702     0.873     0.778       909\n",
      "\n",
      "    accuracy                          0.752      1821\n",
      "   macro avg      0.768     0.752     0.748      1821\n",
      "weighted avg      0.768     0.752     0.748      1821\n",
      "\n",
      "600\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6576, accuracy: 65.0000%, auc: 0.7031\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1547s, loss: 0.3121: 100%|██████████| 34/34 [00:05<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6790s, loss = 0.3121, accuracy: 90.3704%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1816s, loss: 0.0781, accuracy: 98.3333%, auc: 0.9967\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6771%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.0392: 100%|██████████| 34/34 [00:05<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.7007s, loss = 0.0392, accuracy: 99.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1785s, loss: 0.0351, accuracy: 98.3333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7463%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1546s, loss: 0.0100: 100%|██████████| 34/34 [00:05<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6833s, loss = 0.0100, accuracy: 99.8148%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1843s, loss: 0.0042, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7452%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.0047: 100%|██████████| 34/34 [00:05<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6648s, loss = 0.0047, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1814s, loss: 0.0027, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7353%\n",
      "\n",
      "Accuracy: 73.5%\n",
      "Precision: 76.0%\n",
      "Recall: 73.5%\n",
      "F1: 72.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.680     0.890     0.771       912\n",
      "     class_1      0.841     0.580     0.686       909\n",
      "\n",
      "    accuracy                          0.735      1821\n",
      "   macro avg      0.760     0.735     0.729      1821\n",
      "weighted avg      0.760     0.735     0.729      1821\n",
      "\n",
      "600\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6555, accuracy: 71.6667%, auc: 0.7333\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.2699: 100%|██████████| 34/34 [00:05<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6825s, loss = 0.2699, accuracy: 91.4815%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1791s, loss: 0.0638, accuracy: 98.3333%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7485%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0444: 100%|██████████| 34/34 [00:05<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6594s, loss = 0.0444, accuracy: 99.2593%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1824s, loss: 0.0108, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7721%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.0239: 100%|██████████| 34/34 [00:05<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6723s, loss = 0.0239, accuracy: 99.6296%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1812s, loss: 0.0050, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7359%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.0252: 100%|██████████| 34/34 [00:05<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6803s, loss = 0.0252, accuracy: 99.4444%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1847s, loss: 0.0036, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7727%\n",
      "\n",
      "Accuracy: 77.3%\n",
      "Precision: 77.3%\n",
      "Recall: 77.3%\n",
      "F1: 77.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.777     0.765     0.771       912\n",
      "     class_1      0.768     0.780     0.774       909\n",
      "\n",
      "    accuracy                          0.773      1821\n",
      "   macro avg      0.773     0.773     0.773      1821\n",
      "weighted avg      0.773     0.773     0.773      1821\n",
      "\n",
      "600\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7305, accuracy: 53.3333%, auc: 0.2723\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.3476: 100%|██████████| 34/34 [00:05<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6992s, loss = 0.3476, accuracy: 86.4815%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1789s, loss: 0.1231, accuracy: 96.6667%, auc: 0.9989\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6046%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.0396: 100%|██████████| 34/34 [00:05<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6680s, loss = 0.0396, accuracy: 99.2593%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1830s, loss: 0.0087, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7210%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.0088: 100%|██████████| 34/34 [00:05<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6499s, loss = 0.0088, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1807s, loss: 0.0036, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7046%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0059: 100%|██████████| 34/34 [00:05<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6604s, loss = 0.0059, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1826s, loss: 0.0024, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7381%\n",
      "\n",
      "Accuracy: 73.8%\n",
      "Precision: 73.9%\n",
      "Recall: 73.8%\n",
      "F1: 73.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.752     0.712     0.731       912\n",
      "     class_1      0.725     0.765     0.745       909\n",
      "\n",
      "    accuracy                          0.738      1821\n",
      "   macro avg      0.739     0.738     0.738      1821\n",
      "weighted avg      0.739     0.738     0.738      1821\n",
      "\n",
      "600\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7747, accuracy: 35.0000%, auc: 0.3092\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.3462: 100%|██████████| 34/34 [00:05<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6875s, loss = 0.3462, accuracy: 87.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1832s, loss: 0.2115, accuracy: 93.3333%, auc: 0.9844\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5475%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1555s, loss: 0.0881: 100%|██████████| 34/34 [00:05<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.7055s, loss = 0.0881, accuracy: 97.9630%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1877s, loss: 0.0249, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7100%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1543s, loss: 0.0251: 100%|██████████| 34/34 [00:05<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6753s, loss = 0.0251, accuracy: 99.6296%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.1839s, loss: 0.0091, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7265%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0088: 100%|██████████| 34/34 [00:05<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6386s, loss = 0.0088, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.1807s, loss: 0.0059, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7556%\n",
      "\n",
      "Accuracy: 75.6%\n",
      "Precision: 76.8%\n",
      "Recall: 75.5%\n",
      "F1: 75.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.711     0.864     0.780       912\n",
      "     class_1      0.826     0.647     0.725       909\n",
      "\n",
      "    accuracy                          0.756      1821\n",
      "   macro avg      0.768     0.755     0.753      1821\n",
      "weighted avg      0.768     0.756     0.753      1821\n",
      "\n",
      "600\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6516, accuracy: 58.3333%, auc: 0.7645\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.3475: 100%|██████████| 34/34 [00:05<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6701s, loss = 0.3475, accuracy: 89.8148%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.1791s, loss: 0.0833, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6420%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1547s, loss: 0.0537: 100%|██████████| 34/34 [00:05<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 5.6899s, loss = 0.0537, accuracy: 99.0741%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.1862s, loss: 0.0421, accuracy: 98.3333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 64.2%\n",
      "Precision: 70.1%\n",
      "Recall: 64.2%\n",
      "F1: 61.4%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.810     0.373     0.511       912\n",
      "     class_1      0.592     0.912     0.718       909\n",
      "\n",
      "    accuracy                          0.642      1821\n",
      "   macro avg      0.701     0.642     0.614      1821\n",
      "weighted avg      0.701     0.642     0.614      1821\n",
      "\n",
      "700\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6976, accuracy: 47.1429%, auc: 0.4890\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.2058: 100%|██████████| 40/40 [00:06<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6549s, loss = 0.2058, accuracy: 94.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2191s, loss: 0.0344, accuracy: 98.5714%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6568%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0302: 100%|██████████| 40/40 [00:06<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6579s, loss = 0.0302, accuracy: 99.5238%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2177s, loss: 0.0064, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6425%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.0080: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6297s, loss = 0.0080, accuracy: 99.8413%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2167s, loss: 0.1622, accuracy: 97.1429%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 64.3%\n",
      "Precision: 73.7%\n",
      "Recall: 64.3%\n",
      "F1: 60.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.887     0.328     0.479       912\n",
      "     class_1      0.587     0.958     0.728       909\n",
      "\n",
      "    accuracy                          0.643      1821\n",
      "   macro avg      0.737     0.643     0.603      1821\n",
      "weighted avg      0.737     0.643     0.603      1821\n",
      "\n",
      "700\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7235, accuracy: 42.8571%, auc: 0.4898\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.3304: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6245s, loss = 0.3304, accuracy: 88.7302%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2146s, loss: 0.1038, accuracy: 95.7143%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5826%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1528s, loss: 0.0445: 100%|██████████| 40/40 [00:06<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6047s, loss = 0.0445, accuracy: 99.3651%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2154s, loss: 0.0107, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6233%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1528s, loss: 0.0090: 100%|██████████| 40/40 [00:06<00:00,  6.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6092s, loss = 0.0090, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2144s, loss: 0.0032, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7013%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1532s, loss: 0.0036: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6231s, loss = 0.0036, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2147s, loss: 0.0018, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6919%\n",
      "\n",
      "Accuracy: 69.2%\n",
      "Precision: 74.4%\n",
      "Recall: 69.2%\n",
      "F1: 67.5%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.856     0.463     0.601       912\n",
      "     class_1      0.631     0.922     0.749       909\n",
      "\n",
      "    accuracy                          0.692      1821\n",
      "   macro avg      0.744     0.692     0.675      1821\n",
      "weighted avg      0.744     0.692     0.675      1821\n",
      "\n",
      "700\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6945, accuracy: 50.0000%, auc: 0.5396\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.2605: 100%|██████████| 40/40 [00:06<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6529s, loss = 0.2605, accuracy: 93.1746%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2214s, loss: 0.0373, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6222%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.0303: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6310s, loss = 0.0303, accuracy: 99.5238%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2188s, loss: 0.0057, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7556%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.0064: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6291s, loss = 0.0064, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2153s, loss: 0.0073, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6936%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1537s, loss: 0.0032: 100%|██████████| 40/40 [00:06<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6469s, loss = 0.0032, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2126s, loss: 0.0023, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7282%\n",
      "\n",
      "Accuracy: 72.8%\n",
      "Precision: 76.1%\n",
      "Recall: 72.8%\n",
      "F1: 71.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.855     0.550     0.670       912\n",
      "     class_1      0.668     0.906     0.769       909\n",
      "\n",
      "    accuracy                          0.728      1821\n",
      "   macro avg      0.761     0.728     0.719      1821\n",
      "weighted avg      0.762     0.728     0.719      1821\n",
      "\n",
      "700\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7373, accuracy: 50.0000%, auc: 0.3086\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.3411: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6286s, loss = 0.3411, accuracy: 89.0476%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2110s, loss: 0.0645, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6293%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.0601: 100%|██████████| 40/40 [00:06<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6373s, loss = 0.0601, accuracy: 98.7302%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2152s, loss: 0.0469, accuracy: 98.5714%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 62.9%\n",
      "Precision: 64.3%\n",
      "Recall: 63.0%\n",
      "F1: 62.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.689     0.474     0.561       912\n",
      "     class_1      0.598     0.785     0.679       909\n",
      "\n",
      "    accuracy                          0.629      1821\n",
      "   macro avg      0.643     0.630     0.620      1821\n",
      "weighted avg      0.644     0.629     0.620      1821\n",
      "\n",
      "700\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6835, accuracy: 52.8571%, auc: 0.7339\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.2993: 100%|██████████| 40/40 [00:06<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6605s, loss = 0.2993, accuracy: 90.6349%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2176s, loss: 0.0338, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7188%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1531s, loss: 0.0236: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6281s, loss = 0.0236, accuracy: 99.5238%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2131s, loss: 0.0058, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6233%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1531s, loss: 0.0075: 100%|██████████| 40/40 [00:06<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 6.6220s, loss = 0.0075, accuracy: 99.8413%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2185s, loss: 0.0374, accuracy: 98.5714%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 62.3%\n",
      "Precision: 74.5%\n",
      "Recall: 62.4%\n",
      "F1: 57.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.919     0.272     0.420       912\n",
      "     class_1      0.572     0.976     0.721       909\n",
      "\n",
      "    accuracy                          0.623      1821\n",
      "   macro avg      0.745     0.624     0.570      1821\n",
      "weighted avg      0.745     0.623     0.570      1821\n",
      "\n",
      "800\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7883, accuracy: 40.0000%, auc: 0.3559\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1558s, loss: 0.2470: 100%|██████████| 45/45 [00:07<00:00,  5.95it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5644s, loss = 0.2470, accuracy: 92.7778%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2507s, loss: 0.0356, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7106%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.0326: 100%|██████████| 45/45 [00:07<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5253s, loss = 0.0326, accuracy: 99.7222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2429s, loss: 0.0091, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6628%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1546s, loss: 0.0129: 100%|██████████| 45/45 [00:07<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5181s, loss = 0.0129, accuracy: 99.8611%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2465s, loss: 0.0330, accuracy: 98.7500%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 66.3%\n",
      "Precision: 72.1%\n",
      "Recall: 66.3%\n",
      "F1: 63.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.836     0.407     0.547       912\n",
      "     class_1      0.607     0.920     0.731       909\n",
      "\n",
      "    accuracy                          0.663      1821\n",
      "   macro avg      0.721     0.663     0.639      1821\n",
      "weighted avg      0.722     0.663     0.639      1821\n",
      "\n",
      "800\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7068, accuracy: 48.7500%, auc: 0.4279\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1555s, loss: 0.2507: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5451s, loss = 0.2507, accuracy: 91.3889%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2472s, loss: 0.0252, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6260%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.0354: 100%|██████████| 45/45 [00:07<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5257s, loss = 0.0354, accuracy: 99.1667%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2450s, loss: 0.0633, accuracy: 98.7500%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 62.6%\n",
      "Precision: 68.8%\n",
      "Recall: 62.6%\n",
      "F1: 59.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.795     0.341     0.477       912\n",
      "     class_1      0.580     0.912     0.709       909\n",
      "\n",
      "    accuracy                          0.626      1821\n",
      "   macro avg      0.688     0.626     0.593      1821\n",
      "weighted avg      0.688     0.626     0.593      1821\n",
      "\n",
      "800\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7361, accuracy: 52.5000%, auc: 0.3904\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.3074: 100%|██████████| 45/45 [00:07<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5271s, loss = 0.3074, accuracy: 89.7222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2473s, loss: 0.0225, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6815%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0220: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5404s, loss = 0.0220, accuracy: 99.7222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2448s, loss: 0.0074, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7650%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1554s, loss: 0.0051: 100%|██████████| 45/45 [00:07<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5530s, loss = 0.0051, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2456s, loss: 0.0023, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7479%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.0027: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5458s, loss = 0.0027, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2502s, loss: 0.0014, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7600%\n",
      "\n",
      "Accuracy: 76.0%\n",
      "Precision: 76.1%\n",
      "Recall: 76.0%\n",
      "F1: 76.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.777     0.730     0.753       912\n",
      "     class_1      0.745     0.790     0.767       909\n",
      "\n",
      "    accuracy                          0.760      1821\n",
      "   macro avg      0.761     0.760     0.760      1821\n",
      "weighted avg      0.761     0.760     0.760      1821\n",
      "\n",
      "800\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6877, accuracy: 60.0000%, auc: 0.6096\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.2233: 100%|██████████| 45/45 [00:07<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5321s, loss = 0.2233, accuracy: 94.3056%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2423s, loss: 0.0349, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6485%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.0318: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5376s, loss = 0.0318, accuracy: 99.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2458s, loss: 0.0107, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6722%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1556s, loss: 0.0115: 100%|██████████| 45/45 [00:07<00:00,  5.95it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5615s, loss = 0.0115, accuracy: 99.8611%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2407s, loss: 0.0046, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7282%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1556s, loss: 0.0052: 100%|██████████| 45/45 [00:07<00:00,  5.95it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5654s, loss = 0.0052, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2479s, loss: 0.0030, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7260%\n",
      "\n",
      "Accuracy: 72.6%\n",
      "Precision: 73.6%\n",
      "Recall: 72.6%\n",
      "F1: 72.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.784     0.625     0.696       912\n",
      "     class_1      0.687     0.827     0.751       909\n",
      "\n",
      "    accuracy                          0.726      1821\n",
      "   macro avg      0.736     0.726     0.723      1821\n",
      "weighted avg      0.736     0.726     0.723      1821\n",
      "\n",
      "800\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7006, accuracy: 47.5000%, auc: 0.7638\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1554s, loss: 0.2129: 100%|██████████| 45/45 [00:07<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5497s, loss = 0.2129, accuracy: 94.0278%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2511s, loss: 0.0679, accuracy: 98.7500%, auc: 0.9925\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7452%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0224: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5406s, loss = 0.0224, accuracy: 99.7222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2459s, loss: 0.0072, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7501%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0049: 100%|██████████| 45/45 [00:07<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5332s, loss = 0.0049, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2473s, loss: 0.0023, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7474%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.0032: 100%|██████████| 45/45 [00:07<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 7.5387s, loss = 0.0032, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2488s, loss: 0.0064, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7743%\n",
      "\n",
      "Accuracy: 77.4%\n",
      "Precision: 77.4%\n",
      "Recall: 77.4%\n",
      "F1: 77.4%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.779     0.766     0.773       912\n",
      "     class_1      0.769     0.782     0.776       909\n",
      "\n",
      "    accuracy                          0.774      1821\n",
      "   macro avg      0.774     0.774     0.774      1821\n",
      "weighted avg      0.774     0.774     0.774      1821\n",
      "\n",
      "900\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6806, accuracy: 57.7778%, auc: 0.6843\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.2128: 100%|██████████| 51/51 [00:08<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4951s, loss = 0.2128, accuracy: 92.8395%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2883s, loss: 0.0301, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6447%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.0251: 100%|██████████| 51/51 [00:08<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5380s, loss = 0.0251, accuracy: 99.6296%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2815s, loss: 0.0761, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 64.5%\n",
      "Precision: 75.6%\n",
      "Recall: 64.5%\n",
      "F1: 60.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.926     0.316     0.471       912\n",
      "     class_1      0.587     0.975     0.733       909\n",
      "\n",
      "    accuracy                          0.645      1821\n",
      "   macro avg      0.756     0.645     0.602      1821\n",
      "weighted avg      0.757     0.645     0.602      1821\n",
      "\n",
      "900\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7319, accuracy: 43.3333%, auc: 0.3676\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.2336: 100%|██████████| 51/51 [00:08<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5590s, loss = 0.2336, accuracy: 93.0864%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2827s, loss: 0.0573, accuracy: 98.8889%, auc: 0.9995\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7276%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0282: 100%|██████████| 51/51 [00:08<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4685s, loss = 0.0282, accuracy: 99.6296%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2780s, loss: 0.0549, accuracy: 98.8889%, auc: 0.9931\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7446%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0171: 100%|██████████| 51/51 [00:08<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4622s, loss = 0.0171, accuracy: 99.7531%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2794s, loss: 0.0099, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7287%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.0093: 100%|██████████| 51/51 [00:08<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4951s, loss = 0.0093, accuracy: 99.8765%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2801s, loss: 0.0891, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 72.9%\n",
      "Precision: 76.9%\n",
      "Recall: 72.9%\n",
      "F1: 71.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.875     0.535     0.664       912\n",
      "     class_1      0.664     0.923     0.773       909\n",
      "\n",
      "    accuracy                          0.729      1821\n",
      "   macro avg      0.769     0.729     0.718      1821\n",
      "weighted avg      0.770     0.729     0.718      1821\n",
      "\n",
      "900\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8031, accuracy: 51.1111%, auc: 0.2628\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1554s, loss: 0.3072: 100%|██████████| 51/51 [00:08<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5573s, loss = 0.3072, accuracy: 87.2840%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2834s, loss: 0.0812, accuracy: 97.7778%, auc: 0.9960\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5931%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1543s, loss: 0.0521: 100%|██████████| 51/51 [00:08<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5040s, loss = 0.0521, accuracy: 99.0123%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2811s, loss: 0.0269, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.5794%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0164: 100%|██████████| 51/51 [00:08<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4866s, loss = 0.0164, accuracy: 99.7531%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.2783s, loss: 0.0307, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.5530%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.0122: 100%|██████████| 51/51 [00:08<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4818s, loss = 0.0122, accuracy: 99.7531%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.2767s, loss: 0.0427, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.5761%\n",
      "\n",
      "Accuracy: 57.6%\n",
      "Precision: 71.3%\n",
      "Recall: 57.7%\n",
      "F1: 49.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.885     0.177     0.294       912\n",
      "     class_1      0.542     0.977     0.697       909\n",
      "\n",
      "    accuracy                          0.576      1821\n",
      "   macro avg      0.713     0.577     0.496      1821\n",
      "weighted avg      0.713     0.576     0.495      1821\n",
      "\n",
      "900\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7646, accuracy: 33.3333%, auc: 0.2579\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1543s, loss: 0.2658: 100%|██████████| 51/51 [00:08<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5006s, loss = 0.2658, accuracy: 92.2222%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2814s, loss: 0.0331, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7331%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1545s, loss: 0.0338: 100%|██████████| 51/51 [00:08<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5099s, loss = 0.0338, accuracy: 99.2593%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2850s, loss: 0.0204, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 73.3%\n",
      "Precision: 76.2%\n",
      "Recall: 73.3%\n",
      "F1: 72.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.850     0.567     0.680       912\n",
      "     class_1      0.674     0.900     0.771       909\n",
      "\n",
      "    accuracy                          0.733      1821\n",
      "   macro avg      0.762     0.733     0.726      1821\n",
      "weighted avg      0.762     0.733     0.726      1821\n",
      "\n",
      "900\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8057, accuracy: 41.1111%, auc: 0.2752\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.2481: 100%|██████████| 51/51 [00:08<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.5468s, loss = 0.2481, accuracy: 93.4568%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.2785s, loss: 0.0302, accuracy: 98.8889%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7655%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.0110: 100%|██████████| 51/51 [00:08<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 8.4934s, loss = 0.0110, accuracy: 100.0000%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.2775s, loss: 0.0838, accuracy: 97.7778%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 76.6%\n",
      "Precision: 77.9%\n",
      "Recall: 76.6%\n",
      "F1: 76.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.841     0.656     0.737       912\n",
      "     class_1      0.717     0.876     0.789       909\n",
      "\n",
      "    accuracy                          0.766      1821\n",
      "   macro avg      0.779     0.766     0.763      1821\n",
      "weighted avg      0.779     0.766     0.763      1821\n",
      "\n",
      "1000\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7707, accuracy: 58.0000%, auc: 0.4821\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.1819: 100%|██████████| 57/57 [00:09<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4832s, loss = 0.1819, accuracy: 93.4444%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3168s, loss: 0.1243, accuracy: 96.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6733%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1533s, loss: 0.0175: 100%|██████████| 57/57 [00:09<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4391s, loss = 0.0175, accuracy: 99.7778%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3161s, loss: 0.0063, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6837%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0051: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4748s, loss = 0.0051, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3267s, loss: 0.0035, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7133%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.0030: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4671s, loss = 0.0030, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3180s, loss: 0.0024, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7183%\n",
      "\n",
      "Accuracy: 71.8%\n",
      "Precision: 73.7%\n",
      "Recall: 71.9%\n",
      "F1: 71.3%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.803     0.580     0.673       912\n",
      "     class_1      0.670     0.857     0.752       909\n",
      "\n",
      "    accuracy                          0.718      1821\n",
      "   macro avg      0.737     0.719     0.713      1821\n",
      "weighted avg      0.737     0.718     0.713      1821\n",
      "\n",
      "1000\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7834, accuracy: 44.0000%, auc: 0.4635\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.2486: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4713s, loss = 0.2486, accuracy: 91.6667%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3171s, loss: 0.0287, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7392%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1536s, loss: 0.0225: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4595s, loss = 0.0225, accuracy: 99.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3188s, loss: 0.0678, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 73.9%\n",
      "Precision: 74.5%\n",
      "Recall: 73.9%\n",
      "F1: 73.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.783     0.663     0.718       912\n",
      "     class_1      0.707     0.815     0.757       909\n",
      "\n",
      "    accuracy                          0.739      1821\n",
      "   macro avg      0.745     0.739     0.738      1821\n",
      "weighted avg      0.745     0.739     0.738      1821\n",
      "\n",
      "1000\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7952, accuracy: 42.0000%, auc: 0.4010\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.2054: 100%|██████████| 57/57 [00:09<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4895s, loss = 0.2054, accuracy: 94.0000%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3196s, loss: 0.1099, accuracy: 96.0000%, auc: 0.9996\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7666%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0183: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4564s, loss = 0.0183, accuracy: 99.7778%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3183s, loss: 0.0601, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7705%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1536s, loss: 0.0151: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4626s, loss = 0.0151, accuracy: 99.7778%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3245s, loss: 0.0543, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6766%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.0084: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4784s, loss = 0.0084, accuracy: 99.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3184s, loss: 0.0049, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.5931%\n",
      "\n",
      "Accuracy: 59.3%\n",
      "Precision: 76.2%\n",
      "Recall: 59.4%\n",
      "F1: 51.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.972     0.193     0.322       912\n",
      "     class_1      0.551     0.994     0.709       909\n",
      "\n",
      "    accuracy                          0.593      1821\n",
      "   macro avg      0.762     0.594     0.516      1821\n",
      "weighted avg      0.762     0.593     0.515      1821\n",
      "\n",
      "1000\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7777, accuracy: 44.0000%, auc: 0.2330\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1543s, loss: 0.2242: 100%|██████████| 57/57 [00:09<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4977s, loss = 0.2242, accuracy: 92.7778%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3206s, loss: 0.0543, accuracy: 98.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7227%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.0200: 100%|██████████| 57/57 [00:09<00:00,  6.04it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4406s, loss = 0.0200, accuracy: 99.5556%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3182s, loss: 0.0560, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7710%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0194: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4573s, loss = 0.0194, accuracy: 99.2222%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3210s, loss: 0.1991, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7304%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1538s, loss: 0.0072: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4641s, loss = 0.0072, accuracy: 99.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3263s, loss: 0.0097, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6639%\n",
      "\n",
      "Accuracy: 66.4%\n",
      "Precision: 74.4%\n",
      "Recall: 66.4%\n",
      "F1: 63.4%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.885     0.378     0.530       912\n",
      "     class_1      0.604     0.950     0.738       909\n",
      "\n",
      "    accuracy                          0.664      1821\n",
      "   macro avg      0.744     0.664     0.634      1821\n",
      "weighted avg      0.744     0.664     0.634      1821\n",
      "\n",
      "1000\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7048, accuracy: 56.0000%, auc: 0.4554\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.2227: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4779s, loss = 0.2227, accuracy: 92.1111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3174s, loss: 0.0690, accuracy: 98.0000%, auc: 0.9996\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7529%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1534s, loss: 0.0304: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4536s, loss = 0.0304, accuracy: 99.3333%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3200s, loss: 0.0473, accuracy: 99.0000%, auc: 0.9984\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7430%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1535s, loss: 0.0175: 100%|██████████| 57/57 [00:09<00:00,  6.03it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4550s, loss = 0.0175, accuracy: 99.6667%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3184s, loss: 0.0321, accuracy: 99.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6085%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0052: 100%|██████████| 57/57 [00:09<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 9.4780s, loss = 0.0052, accuracy: 99.8889%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3156s, loss: 0.0545, accuracy: 99.0000%, auc: 0.9992\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7122%\n",
      "\n",
      "Accuracy: 71.2%\n",
      "Precision: 75.7%\n",
      "Recall: 71.3%\n",
      "F1: 69.9%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.865     0.504     0.637       912\n",
      "     class_1      0.649     0.921     0.762       909\n",
      "\n",
      "    accuracy                          0.712      1821\n",
      "   macro avg      0.757     0.713     0.699      1821\n",
      "weighted avg      0.757     0.712     0.699      1821\n",
      "\n",
      "1100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7560, accuracy: 43.6364%, auc: 0.2982\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.2189: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3959s, loss = 0.2189, accuracy: 92.0202%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3399s, loss: 0.0149, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7133%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.0245: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3712s, loss = 0.0245, accuracy: 99.4949%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3396s, loss: 0.0035, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7672%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.0080: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3709s, loss = 0.0080, accuracy: 99.8990%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3455s, loss: 0.0017, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7501%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.0128: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3772s, loss = 0.0128, accuracy: 99.7980%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3399s, loss: 0.0015, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6513%\n",
      "\n",
      "Accuracy: 65.1%\n",
      "Precision: 77.8%\n",
      "Recall: 65.2%\n",
      "F1: 60.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.966     0.315     0.475       912\n",
      "     class_1      0.590     0.989     0.739       909\n",
      "\n",
      "    accuracy                          0.651      1821\n",
      "   macro avg      0.778     0.652     0.607      1821\n",
      "weighted avg      0.778     0.651     0.607      1821\n",
      "\n",
      "1100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6809, accuracy: 54.5455%, auc: 0.6628\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.1942: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3850s, loss = 0.1942, accuracy: 94.6465%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3391s, loss: 0.0115, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7644%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.0337: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3722s, loss = 0.0337, accuracy: 98.9899%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3438s, loss: 0.0069, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7507%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.0098: 100%|██████████| 62/62 [00:10<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.4070s, loss = 0.0098, accuracy: 99.7980%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3426s, loss: 0.0019, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7271%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1547s, loss: 0.0020: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3649s, loss = 0.0020, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3454s, loss: 0.0012, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7534%\n",
      "\n",
      "Accuracy: 75.3%\n",
      "Precision: 78.4%\n",
      "Recall: 75.4%\n",
      "F1: 74.7%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.876     0.591     0.706       912\n",
      "     class_1      0.691     0.916     0.788       909\n",
      "\n",
      "    accuracy                          0.753      1821\n",
      "   macro avg      0.784     0.754     0.747      1821\n",
      "weighted avg      0.784     0.753     0.747      1821\n",
      "\n",
      "1100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6608, accuracy: 70.9091%, auc: 0.7038\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.1883: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3784s, loss = 0.1883, accuracy: 94.5455%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3370s, loss: 0.0160, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7523%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.0219: 100%|██████████| 62/62 [00:10<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3980s, loss = 0.0219, accuracy: 99.3939%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3467s, loss: 0.0026, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7759%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0130: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3890s, loss = 0.0130, accuracy: 99.6970%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3425s, loss: 0.0019, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7639%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.0022: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3765s, loss = 0.0022, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3403s, loss: 0.0010, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.6656%\n",
      "\n",
      "Accuracy: 66.6%\n",
      "Precision: 76.2%\n",
      "Recall: 66.6%\n",
      "F1: 63.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.922     0.363     0.521       912\n",
      "     class_1      0.603     0.969     0.743       909\n",
      "\n",
      "    accuracy                          0.666      1821\n",
      "   macro avg      0.762     0.666     0.632      1821\n",
      "weighted avg      0.763     0.666     0.632      1821\n",
      "\n",
      "1100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6759, accuracy: 55.4545%, auc: 0.6139\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1550s, loss: 0.2050: 100%|██████████| 62/62 [00:10<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3790s, loss = 0.2050, accuracy: 94.0404%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3456s, loss: 0.0412, accuracy: 99.0909%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6568%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1553s, loss: 0.0180: 100%|██████████| 62/62 [00:10<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3981s, loss = 0.0180, accuracy: 99.5960%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3407s, loss: 0.0030, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7337%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.0053: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3856s, loss = 0.0053, accuracy: 99.8990%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3427s, loss: 0.0019, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6463%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.0025: 100%|██████████| 62/62 [00:10<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3622s, loss = 0.0025, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3402s, loss: 0.0009, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7705%\n",
      "\n",
      "Accuracy: 77.0%\n",
      "Precision: 77.2%\n",
      "Recall: 77.0%\n",
      "F1: 77.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.750     0.812     0.780       912\n",
      "     class_1      0.795     0.728     0.760       909\n",
      "\n",
      "    accuracy                          0.770      1821\n",
      "   macro avg      0.772     0.770     0.770      1821\n",
      "weighted avg      0.772     0.770     0.770      1821\n",
      "\n",
      "1100\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.8892, accuracy: 50.9091%, auc: 0.3421\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1556s, loss: 0.2217: 100%|██████████| 62/62 [00:10<00:00,  5.96it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.4110s, loss = 0.2217, accuracy: 92.7273%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3397s, loss: 0.0508, accuracy: 99.0909%, auc: 0.9993\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7095%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1552s, loss: 0.0228: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3943s, loss = 0.0228, accuracy: 99.4949%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3435s, loss: 0.0052, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7913%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1551s, loss: 0.0123: 100%|██████████| 62/62 [00:10<00:00,  5.97it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 10.3876s, loss = 0.0123, accuracy: 99.6970%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3418s, loss: 0.0567, accuracy: 99.0909%, auc: 0.9997\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 79.1%\n",
      "Precision: 79.2%\n",
      "Recall: 79.1%\n",
      "F1: 79.1%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.800     0.779     0.789       912\n",
      "     class_1      0.783     0.804     0.794       909\n",
      "\n",
      "    accuracy                          0.791      1821\n",
      "   macro avg      0.792     0.791     0.791      1821\n",
      "weighted avg      0.792     0.791     0.791      1821\n",
      "\n",
      "1200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7197, accuracy: 41.6667%, auc: 0.2991\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1546s, loss: 0.2444: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3604s, loss = 0.2444, accuracy: 90.9259%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3801s, loss: 0.0203, accuracy: 99.1667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.6337%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1536s, loss: 0.0159: 100%|██████████| 68/68 [00:11<00:00,  6.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3042s, loss = 0.0159, accuracy: 99.6296%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3762s, loss: 0.0096, accuracy: 99.1667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.6002%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.0029: 100%|██████████| 68/68 [00:11<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3269s, loss = 0.0029, accuracy: 100.0000%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3830s, loss: 0.0025, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.6359%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1546s, loss: 0.0016: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3603s, loss = 0.0016, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3845s, loss: 0.0008, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7095%\n",
      "\n",
      "Accuracy: 71.0%\n",
      "Precision: 75.5%\n",
      "Recall: 71.0%\n",
      "F1: 69.6%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.862     0.500     0.633       912\n",
      "     class_1      0.647     0.920     0.760       909\n",
      "\n",
      "    accuracy                          0.710      1821\n",
      "   macro avg      0.755     0.710     0.696      1821\n",
      "weighted avg      0.755     0.710     0.696      1821\n",
      "\n",
      "1200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7240, accuracy: 41.6667%, auc: 0.4129\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.2185: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3500s, loss = 0.2185, accuracy: 93.6111%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3762s, loss: 0.0184, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7117%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.0385: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3342s, loss = 0.0385, accuracy: 98.9815%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3768s, loss: 0.0048, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7128%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1543s, loss: 0.0059: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3376s, loss = 0.0059, accuracy: 99.9074%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3858s, loss: 0.0019, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7331%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1546s, loss: 0.0020: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3596s, loss = 0.0020, accuracy: 100.0000%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3842s, loss: 0.0011, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7337%\n",
      "\n",
      "Accuracy: 73.4%\n",
      "Precision: 76.7%\n",
      "Recall: 73.4%\n",
      "F1: 72.5%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.862     0.557     0.677       912\n",
      "     class_1      0.672     0.911     0.773       909\n",
      "\n",
      "    accuracy                          0.734      1821\n",
      "   macro avg      0.767     0.734     0.725      1821\n",
      "weighted avg      0.767     0.734     0.725      1821\n",
      "\n",
      "1200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.7373, accuracy: 50.0000%, auc: 0.4316\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.1538: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3457s, loss = 0.1538, accuracy: 95.0926%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3792s, loss: 0.0554, accuracy: 98.3333%, auc: 0.9994\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.5837%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1540s, loss: 0.0231: 100%|██████████| 68/68 [00:11<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3146s, loss = 0.0231, accuracy: 99.7222%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3792s, loss: 0.0116, accuracy: 99.1667%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7430%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1545s, loss: 0.0208: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3462s, loss = 0.0208, accuracy: 99.4444%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3852s, loss: 0.0839, accuracy: 98.3333%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 74.3%\n",
      "Precision: 76.4%\n",
      "Recall: 74.3%\n",
      "F1: 73.8%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.838     0.603     0.702       912\n",
      "     class_1      0.689     0.883     0.774       909\n",
      "\n",
      "    accuracy                          0.743      1821\n",
      "   macro avg      0.764     0.743     0.738      1821\n",
      "weighted avg      0.764     0.743     0.738      1821\n",
      "\n",
      "1200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6960, accuracy: 53.3333%, auc: 0.5823\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1548s, loss: 0.1860: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3596s, loss = 0.1860, accuracy: 93.2407%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3796s, loss: 0.0085, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7386%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1541s, loss: 0.0207: 100%|██████████| 68/68 [00:11<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3213s, loss = 0.0207, accuracy: 99.6296%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3770s, loss: 0.0032, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7765%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1539s, loss: 0.0067: 100%|██████████| 68/68 [00:11<00:00,  6.01it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3140s, loss = 0.0067, accuracy: 99.8148%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3808s, loss: 0.0018, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7501%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.0038: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3407s, loss = 0.0038, accuracy: 99.9074%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3877s, loss: 0.0012, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 4:\n",
      "Test accuracy: 0.7655%\n",
      "\n",
      "Accuracy: 76.6%\n",
      "Precision: 78.4%\n",
      "Recall: 76.6%\n",
      "F1: 76.2%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.857     0.638     0.732       912\n",
      "     class_1      0.711     0.893     0.792       909\n",
      "\n",
      "    accuracy                          0.766      1821\n",
      "   macro avg      0.784     0.766     0.762      1821\n",
      "weighted avg      0.784     0.766     0.762      1821\n",
      "\n",
      "1200\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google-bert/bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
      "/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "====================  Preparing for training  ====================\n",
      "\t* Loading training data...\n",
      "\t* Loading validation data...\n",
      "\t* Loading test data...\n",
      "\t* Building model...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:591: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "* Validation loss before training: 0.6804, accuracy: 58.3333%, auc: 0.6010\n",
      "\n",
      " ==================== Training bert model on device: cuda ====================\n",
      "* Training epoch 1:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1549s, loss: 0.1659: 100%|██████████| 68/68 [00:11<00:00,  5.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3664s, loss = 0.1659, accuracy: 95.0926%\n",
      "* Validation for epoch 1:\n",
      "-> Valid. time: 0.3908s, loss: 0.0085, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 1:\n",
      "Test accuracy: 0.7573%\n",
      "\n",
      "* Training epoch 2:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.0231: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3431s, loss = 0.0231, accuracy: 99.4444%\n",
      "* Validation for epoch 2:\n",
      "-> Valid. time: 0.3832s, loss: 0.0035, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 2:\n",
      "Test accuracy: 0.7754%\n",
      "\n",
      "* Training epoch 3:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1544s, loss: 0.0041: 100%|██████████| 68/68 [00:11<00:00,  5.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3468s, loss = 0.0041, accuracy: 99.9074%\n",
      "* Validation for epoch 3:\n",
      "-> Valid. time: 0.3760s, loss: 0.0035, accuracy: 100.0000%, auc: 1.0000\n",
      "\n",
      "save model succesfully!\n",
      "\n",
      "* Test for epoch 3:\n",
      "Test accuracy: 0.7529%\n",
      "\n",
      "* Training epoch 4:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Avg. batch proc. time: 0.1542s, loss: 0.0077: 100%|██████████| 68/68 [00:11<00:00,  6.00it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-> Training time: 11.3326s, loss = 0.0077, accuracy: 99.9074%\n",
      "* Validation for epoch 4:\n",
      "-> Valid. time: 0.3841s, loss: 0.0102, accuracy: 99.1667%, auc: 1.0000\n",
      "\n",
      "-> Early stopping: patience limit reached, stopping...\n",
      "Accuracy: 75.3%\n",
      "Precision: 76.5%\n",
      "Recall: 75.3%\n",
      "F1: 75.0%\n",
      "classification_report:\n",
      "\n",
      "              precision    recall  f1-score   support\n",
      "\n",
      "     class_0      0.821     0.648     0.724       912\n",
      "     class_1      0.708     0.858     0.776       909\n",
      "\n",
      "    accuracy                          0.753      1821\n",
      "   macro avg      0.765     0.753     0.750      1821\n",
      "weighted avg      0.765     0.753     0.750      1821\n",
      "\n"
     ]
    }
   ],
   "source": [
    "rand_k_results_df = pd.DataFrame(columns=['K', 'acc', 'f1'])\n",
    "results_save_name = f\"rand_k_results-{datestr}.csv\"\n",
    "\n",
    "for K in Ks:\n",
    "  # Pull even numbers of positive and negative samples\n",
    "  pos_samples = pos_syn_df.sample(n=K//2, random_state=42)\n",
    "  neg_samples = neg_syn_df.sample(n=K//2, random_state=42)\n",
    "\n",
    "  data_df = pd.concat([pos_samples, neg_samples])\n",
    "  # data_df = data_df.drop(columns=['embedding'])\n",
    "  for i in range(NUM_REPS):\n",
    "    acc, f1 = train_model_random(K, data_df, test_df, target_dir)\n",
    "    rand_k_results_df = pd.concat([rand_k_results_df, pd.DataFrame({'K': K, 'acc': [acc], 'f1': [f1]})], ignore_index=True)\n",
    "  rand_k_results_df.to_csv(os.path.join(target_dir, results_save_name))"
   ]
  }
 ],
 "metadata": {
  "accelerator": "GPU",
  "colab": {
   "gpuType": "L4",
   "machine_shape": "hm",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  },
  "varInspector": {
   "cols": {
    "lenName": 16,
    "lenType": 16,
    "lenVar": 40
   },
   "kernels_config": {
    "python": {
     "delete_cmd_postfix": "",
     "delete_cmd_prefix": "del ",
     "library": "var_list.py",
     "varRefreshCmd": "print(var_dic_list())"
    },
    "r": {
     "delete_cmd_postfix": ") ",
     "delete_cmd_prefix": "rm(",
     "library": "var_list.r",
     "varRefreshCmd": "cat(var_dic_list()) "
    }
   },
   "types_to_exclude": [
    "module",
    "function",
    "builtin_function_or_method",
    "instance",
    "_Feature"
   ],
   "window_display": false
  },
  "widgets": {
   "application/vnd.jupyter.widget-state+json": {
    "02edcbf7bbc249a29ad244b0428531a8": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "0826f510218b466eb1845043abcc4130": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_516971a7b62b4945a6fa34e65d099f69",
       "IPY_MODEL_2473829b9c2742b9b7c2e093a930bcdf",
       "IPY_MODEL_7257ed6000954b09b13c63c136715882"
      ],
      "layout": "IPY_MODEL_81b9b9bece6a4337a7cf8e6b9017feec"
     }
    },
    "09f10b2958e842f3ab7e18035efdf75d": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_d95cc2c3c9a443afbc9a8ca768fc8007",
       "IPY_MODEL_af3da40cc65649c89236a8a37a2eb3ea",
       "IPY_MODEL_1a67f5ffeb9746a3a37883dec437e968"
      ],
      "layout": "IPY_MODEL_57e6bc8f31b84afa92732ea307d3942f"
     }
    },
    "0c72b6cbae2a4a5088f6f750f657ba72": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "0d1e360d2139470c807f04fc1b46f221": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "129e20221232419bbc3533cbab76fa93": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_663506a165b1427796274d381d366123",
      "max": 440449768,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_b02bd446fd2d48ad8951ccfa02a59cf8",
      "value": 440449768
     }
    },
    "15880d1eafff4e8885ec11fc66eb20ec": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "1991f4cbf9d5438e83fad021c2677972": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_a53848f15e4a4ac5ae6cb2deb30f1da5",
      "placeholder": "​",
      "style": "IPY_MODEL_2a98e22cdc8b4b338aeccf00c76500e1",
      "value": " 440M/440M [00:01&lt;00:00, 506MB/s]"
     }
    },
    "1a67f5ffeb9746a3a37883dec437e968": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_309413fde8764de2b13567284e472aa4",
      "placeholder": "​",
      "style": "IPY_MODEL_7828c2d9620d47d982c83d7f826325d8",
      "value": " 232k/232k [00:00&lt;00:00, 10.8MB/s]"
     }
    },
    "1f32563781234251ab589618c62441ee": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "2473829b9c2742b9b7c2e093a930bcdf": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_9d9c9ab3a1ad4e58addb885271776867",
      "max": 48,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_9bac258e5421495298ec04d03c9cfc47",
      "value": 48
     }
    },
    "2a98e22cdc8b4b338aeccf00c76500e1": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "309413fde8764de2b13567284e472aa4": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "316d53715c7d4c179c41422ece261a2b": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "3711473f681a489297a32650a74fa2c2": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_ff33a45708ae4331beb0a037de6e42bb",
       "IPY_MODEL_6525bad8ac6743f0ae5bc7fa4b6842f3",
       "IPY_MODEL_ef73adeea2034e36b82a721bde5fe6ed"
      ],
      "layout": "IPY_MODEL_a305e6d37d4d48028dd90f4eb5f8f2b1"
     }
    },
    "44f88c1a61f146ee9ba2d85c98286d5c": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "4576e26b03794806a18db8960f77f3ea": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "516971a7b62b4945a6fa34e65d099f69": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_90fc6dcd85f84a3ea7a65d561f9a868e",
      "placeholder": "​",
      "style": "IPY_MODEL_316d53715c7d4c179c41422ece261a2b",
      "value": "tokenizer_config.json: 100%"
     }
    },
    "57e6bc8f31b84afa92732ea307d3942f": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "582cc43ffa344802b78bbf47c7dcfb6f": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "5a119b8b191d42879f23a320a5002ce4": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_714320b450f44064994d2d797ecf3a77",
      "placeholder": "​",
      "style": "IPY_MODEL_582cc43ffa344802b78bbf47c7dcfb6f",
      "value": "model.safetensors: 100%"
     }
    },
    "5ef28d4b85c446698225f093d90f1bac": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "5f5833d9c53b4d43b40ef63b2824704e": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "63f42b7ff026482a93efac91478215e4": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "6525bad8ac6743f0ae5bc7fa4b6842f3": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_4576e26b03794806a18db8960f77f3ea",
      "max": 570,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_996ecf66ca0a4080b03f5fe08a3799c5",
      "value": 570
     }
    },
    "663506a165b1427796274d381d366123": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "714320b450f44064994d2d797ecf3a77": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "7257ed6000954b09b13c63c136715882": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_ace708058b7946c680e4ea72a992269c",
      "placeholder": "​",
      "style": "IPY_MODEL_8fda0d670095475cbfb0e0476365904b",
      "value": " 48.0/48.0 [00:00&lt;00:00, 4.09kB/s]"
     }
    },
    "72dd61e0324a4d64b7701473712b1ef2": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_ae9a1b61dfd64d2dae92f6a671ec1763",
      "placeholder": "​",
      "style": "IPY_MODEL_63f42b7ff026482a93efac91478215e4",
      "value": "tokenizer.json: 100%"
     }
    },
    "7828c2d9620d47d982c83d7f826325d8": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "80a1bd7652e74a4e95557db515e2adce": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "81b9b9bece6a4337a7cf8e6b9017feec": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "8fda0d670095475cbfb0e0476365904b": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "90606f8bed0146adb43a136f0ea72b17": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "90fc6dcd85f84a3ea7a65d561f9a868e": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "9260c4eced3f4053bbe3e553b6c54978": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_5a119b8b191d42879f23a320a5002ce4",
       "IPY_MODEL_129e20221232419bbc3533cbab76fa93",
       "IPY_MODEL_1991f4cbf9d5438e83fad021c2677972"
      ],
      "layout": "IPY_MODEL_44f88c1a61f146ee9ba2d85c98286d5c"
     }
    },
    "996ecf66ca0a4080b03f5fe08a3799c5": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "9bac258e5421495298ec04d03c9cfc47": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "9d9c9ab3a1ad4e58addb885271776867": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "9e64068e1aed4268971e33425aebb79a": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "a305e6d37d4d48028dd90f4eb5f8f2b1": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "a53848f15e4a4ac5ae6cb2deb30f1da5": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "ace708058b7946c680e4ea72a992269c": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "ae9a1b61dfd64d2dae92f6a671ec1763": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "af3da40cc65649c89236a8a37a2eb3ea": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_90606f8bed0146adb43a136f0ea72b17",
      "max": 231508,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_80a1bd7652e74a4e95557db515e2adce",
      "value": 231508
     }
    },
    "b02bd446fd2d48ad8951ccfa02a59cf8": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "b13e0504180649828cd2924f8c56a58a": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_5ef28d4b85c446698225f093d90f1bac",
      "max": 466062,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_02edcbf7bbc249a29ad244b0428531a8",
      "value": 466062
     }
    },
    "b25d0ebb00ce4d2aa4840169353e6e6b": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "bc166cef93ec4221882275fcf3b9ac6b": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_9e64068e1aed4268971e33425aebb79a",
      "placeholder": "​",
      "style": "IPY_MODEL_e2344bcd967a46c98edcb30d83b736c7",
      "value": " 466k/466k [00:00&lt;00:00, 30.2MB/s]"
     }
    },
    "bcec675da8d54fdbb8b215b2bc309e2b": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "d95cc2c3c9a443afbc9a8ca768fc8007": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_0d1e360d2139470c807f04fc1b46f221",
      "placeholder": "​",
      "style": "IPY_MODEL_5f5833d9c53b4d43b40ef63b2824704e",
      "value": "vocab.txt: 100%"
     }
    },
    "e2344bcd967a46c98edcb30d83b736c7": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "e36d0c0249674223af00ab11b891dba1": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_72dd61e0324a4d64b7701473712b1ef2",
       "IPY_MODEL_b13e0504180649828cd2924f8c56a58a",
       "IPY_MODEL_bc166cef93ec4221882275fcf3b9ac6b"
      ],
      "layout": "IPY_MODEL_bcec675da8d54fdbb8b215b2bc309e2b"
     }
    },
    "ef73adeea2034e36b82a721bde5fe6ed": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_b25d0ebb00ce4d2aa4840169353e6e6b",
      "placeholder": "​",
      "style": "IPY_MODEL_15880d1eafff4e8885ec11fc66eb20ec",
      "value": " 570/570 [00:00&lt;00:00, 46.5kB/s]"
     }
    },
    "ff33a45708ae4331beb0a037de6e42bb": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_0c72b6cbae2a4a5088f6f750f657ba72",
      "placeholder": "​",
      "style": "IPY_MODEL_1f32563781234251ab589618c62441ee",
      "value": "config.json: 100%"
     }
    }
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
