{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from rdkit import Chem\n",
    "from rdkit.Chem import AllChem\n",
    "import chemprop"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Skipped loading some Tensorflow models, missing a dependency. No module named 'tensorflow'\n",
      "Skipped loading modules with pytorch-geometric dependency, missing a dependency. No module named 'torch_geometric'\n",
      "Skipped loading modules with pytorch-geometric dependency, missing a dependency. cannot import name 'DMPNN' from 'deepchem.models.torch_models' (/home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/deepchem/models/torch_models/__init__.py)\n",
      "Skipped loading modules with pytorch-lightning dependency, missing a dependency. No module named 'pytorch_lightning'\n",
      "Skipped loading some Jax models, missing a dependency. No module named 'jax'\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append('../../../../code')\n",
    "\n",
    "from metrics import get_lo_metrics\n",
    "\n",
    "def chemprop_prepare_df(original_data):\n",
    "    result = pd.DataFrame({\n",
    "        'smiles': original_data['smiles'],\n",
    "        'targets': original_data['value'].astype(float)\n",
    "    })\n",
    "    return result\n",
    "\n",
    "def chemprop_process_folder(input_path, output_path, files=None):\n",
    "    \"\"\"Convert the split CSVs in one folder to the layout chemprop reads.\n",
    "\n",
    "    Each file is read from `input_path`, reduced to 'smiles'/'targets' columns\n",
    "    by `chemprop_prepare_df`, and written under the same name to `output_path`.\n",
    "\n",
    "    Args:\n",
    "        input_path: Directory holding the source CSVs (trailing slash optional).\n",
    "        output_path: Existing directory that receives the converted CSVs.\n",
    "        files: Optional iterable of file names to convert. Defaults to the\n",
    "            three train/test split files.\n",
    "    \"\"\"\n",
    "    # Local import: this cell does not import os, and the function should not\n",
    "    # depend on a later cell having done so.\n",
    "    import os\n",
    "\n",
    "    if files is None:\n",
    "        files = ['train_1.csv', 'train_2.csv', 'train_3.csv', 'test_1.csv', 'test_2.csv', 'test_3.csv']\n",
    "    for file_name in files:\n",
    "        # os.path.join instead of `+` so a directory without a trailing\n",
    "        # separator does not silently produce a wrong path.\n",
    "        input_data = pd.read_csv(os.path.join(input_path, file_name))\n",
    "        output_data = chemprop_prepare_df(input_data)\n",
    "        output_data.to_csv(os.path.join(output_path, file_name), index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>smiles</th>\n",
       "      <th>value</th>\n",
       "      <th>cluster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>C/C(=N\\OC(C)C)c1ccc2c(c1)c1c3c(c4c(c1n2CC(C)C)...</td>\n",
       "      <td>7.897940</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>C/C(=N\\OCC(C)C)c1ccc2[nH]c3c4c(c5c(c3c2c1)CNC5...</td>\n",
       "      <td>8.129819</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>C=CC(=O)Nc1cc2c(Nc3c(F)cc(Br)cc3F)ncnc2cc1OCC1...</td>\n",
       "      <td>6.826814</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>C=CC(=O)Nc1cc2c(Nc3cc(Cl)c(Br)cc3F)ncnc2cc1OCC...</td>\n",
       "      <td>6.376751</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>C=CC(=O)Nc1cc2c(Nc3cc(Cl)c(Cl)cc3Cl)ncnc2cc1OC...</td>\n",
       "      <td>6.102373</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>495</th>\n",
       "      <td>495</td>\n",
       "      <td>c1ccc(-c2ccc(Nc3nnc(-c4cccnc4CCc4ccncc4)o3)cc2...</td>\n",
       "      <td>5.579879</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>496</th>\n",
       "      <td>496</td>\n",
       "      <td>c1ccc(Nc2ncc3c(n2)-c2ccccc2SC3)cc1</td>\n",
       "      <td>5.086133</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>497</th>\n",
       "      <td>497</td>\n",
       "      <td>c1ccc(Oc2ccc(Nc3ncnc4ccccc34)cc2)cc1</td>\n",
       "      <td>5.565271</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>498</th>\n",
       "      <td>498</td>\n",
       "      <td>c1ccc2c(c1)c(-c1cncc(-c3ccsc3)c1)cn2CCN1CCOCC1</td>\n",
       "      <td>7.214670</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>499</th>\n",
       "      <td>499</td>\n",
       "      <td>c1ccc2c3c([nH]c2c1)-c1n[nH]cc1CCC3</td>\n",
       "      <td>6.135953</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>500 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                             smiles     value  \\\n",
       "0             0  C/C(=N\\OC(C)C)c1ccc2c(c1)c1c3c(c4c(c1n2CC(C)C)...  7.897940   \n",
       "1             1  C/C(=N\\OCC(C)C)c1ccc2[nH]c3c4c(c5c(c3c2c1)CNC5...  8.129819   \n",
       "2             2  C=CC(=O)Nc1cc2c(Nc3c(F)cc(Br)cc3F)ncnc2cc1OCC1...  6.826814   \n",
       "3             3  C=CC(=O)Nc1cc2c(Nc3cc(Cl)c(Br)cc3F)ncnc2cc1OCC...  6.376751   \n",
       "4             4  C=CC(=O)Nc1cc2c(Nc3cc(Cl)c(Cl)cc3Cl)ncnc2cc1OC...  6.102373   \n",
       "..          ...                                                ...       ...   \n",
       "495         495  c1ccc(-c2ccc(Nc3nnc(-c4cccnc4CCc4ccncc4)o3)cc2...  5.579879   \n",
       "496         496                 c1ccc(Nc2ncc3c(n2)-c2ccccc2SC3)cc1  5.086133   \n",
       "497         497               c1ccc(Oc2ccc(Nc3ncnc4ccccc34)cc2)cc1  5.565271   \n",
       "498         498     c1ccc2c(c1)c(-c1cncc(-c3ccsc3)c1)cn2CCN1CCOCC1  7.214670   \n",
       "499         499                 c1ccc2c3c([nH]c2c1)-c1n[nH]cc1CCC3  6.135953   \n",
       "\n",
       "     cluster  \n",
       "0          0  \n",
       "1          0  \n",
       "2          0  \n",
       "3          0  \n",
       "4          0  \n",
       "..       ...  \n",
       "495        0  \n",
       "496        0  \n",
       "497        0  \n",
       "498        0  \n",
       "499        0  \n",
       "\n",
       "[500 rows x 4 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Split 1 of the KDR data; `train` is shown as this cell's output.\n",
    "kdr_split_dir = '../../../../data/lo/kdr/'\n",
    "train = pd.read_csv(kdr_split_dir + 'train_1.csv')\n",
    "test = pd.read_csv(kdr_split_dir + 'test_1.csv')\n",
    "\n",
    "train"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import shutil\n",
    "\n",
    "# Scratch directory for the chemprop-formatted CSVs; recreated empty on every run.\n",
    "# Keep the trailing slash: later cells build file paths by string concatenation.\n",
    "temp_datapath = '/tmp/chemprop/'\n",
    "if os.path.isdir(temp_datapath):\n",
    "    shutil.rmtree(temp_datapath)\n",
    "os.makedirs(temp_datapath)\n",
    "\n",
    "# Relative location of the KDR splits, matching the path the train/test frames\n",
    "# are read from in this notebook, instead of a machine-specific absolute path.\n",
    "# NOTE(review): assumes the kernel's working directory is the notebook's folder.\n",
    "input_paths = [\n",
    "    '../../../../data/lo/kdr/'\n",
    "]\n",
    "\n",
    "output_paths = [\n",
    "    temp_datapath\n",
    "]\n",
    "\n",
    "# Convert every input folder into its paired output folder.\n",
    "for input_path, output_path in zip(input_paths, output_paths):\n",
    "    chemprop_process_folder(input_path, output_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Fixed chemprop command-line tokens; paths are built from temp_datapath.\n",
    "split_1_train_csv = temp_datapath + 'train_1.csv'\n",
    "split_1_test_csv = temp_datapath + 'test_1.csv'\n",
    "\n",
    "base_arguments = [\n",
    "    '--dataset_type', 'regression',\n",
    "    '--data_path', split_1_train_csv,\n",
    "    # NOTE(review): validation and test both point at test_1.csv, so any model\n",
    "    # selection based on the validation metric sees the test data - confirm\n",
    "    # this is intended.\n",
    "    '--separate_val_path', split_1_test_csv,\n",
    "    '--separate_test_path', split_1_test_csv,\n",
    "    '--save_preds',\n",
    "    '--metric', 'mae',\n",
    "    '--epochs', '50',\n",
    "    '--gpu', '0',\n",
    "    '--save_dir', temp_datapath + 'checkpoint',\n",
    "    # Extra molecule-level features from the rdkit_2d_normalized generator,\n",
    "    # passed without additional feature scaling.\n",
    "    '--features_generator', 'rdkit_2d_normalized',\n",
    "    '--no_features_scaling',\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "param_dict = {\n",
    "    '--depth': ['3', '4', '5', '6'],\n",
    "    '--dropout': ['0.0', '0.2', '0.3', '0.5', '0.7'],\n",
    "    '--ffn_hidden_size': ['600', '1200', '2400', '3600'],\n",
    "    '--ffn_num_layers': ['1', '2', '3'],\n",
    "    '--hidden_size': ['600', '1200', '2400', '3600']\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "0it [00:00, ?it/s]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 2,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 0\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '2', '--ffn_hidden_size': '600', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 369672.48it/s]\n",
      "100%|██████████| 500/500 [00:12<00:00, 39.52it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 146982.90it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 217272.50it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 35.32it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 253760.33it/s]\n",
      "437it [00:00, 400811.47it/s]\n",
      "100%|██████████| 437/437 [00:10<00:00, 41.68it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 245665.57it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 4,059,601\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3323e+00, PNorm = 59.7291, GNorm = 7.4656, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938956\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8528e-01, PNorm = 59.8093, GNorm = 3.2272, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893636\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3525e-01, PNorm = 59.8936, GNorm = 7.3429, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.972523\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2200e-01, PNorm = 59.9475, GNorm = 5.6939, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913559\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9102e-01, PNorm = 59.9817, GNorm = 3.5591, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933988\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8716e-01, PNorm = 60.0049, GNorm = 1.8725, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902540\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6062e-01, PNorm = 60.0240, GNorm = 3.2817, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877216\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2222e-01, PNorm = 60.0447, GNorm = 5.2732, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871416\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1349e-01, PNorm = 60.0635, GNorm = 2.2205, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876379\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9666e-01, PNorm = 60.0862, GNorm = 3.1442, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876784\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3381e-01, PNorm = 60.1089, GNorm = 1.9817, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879141\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4047e-01, PNorm = 60.1249, GNorm = 2.3574, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874728\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1923e-01, PNorm = 60.1469, GNorm = 2.8225, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881744\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3017e-01, PNorm = 60.1638, GNorm = 1.7330, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883593\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5033e-01, PNorm = 60.1828, GNorm = 2.6733, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897671\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1117e-01, PNorm = 60.2029, GNorm = 1.6168, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881171\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6427e-01, PNorm = 60.2215, GNorm = 3.9240, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881821\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7487e-01, PNorm = 60.2394, GNorm = 2.0914, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865934\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5669e-01, PNorm = 60.2585, GNorm = 2.2339, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891404\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1420e-01, PNorm = 60.2784, GNorm = 2.6547, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883498\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6986e-01, PNorm = 60.2960, GNorm = 2.1602, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876866\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1776e-01, PNorm = 60.3127, GNorm = 1.6608, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895808\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1827e-01, PNorm = 60.3310, GNorm = 2.2567, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909626\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3908e-01, PNorm = 60.3482, GNorm = 1.8731, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915937\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3309e-01, PNorm = 60.3696, GNorm = 4.3985, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890483\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0393e-01, PNorm = 60.3893, GNorm = 1.5065, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881955\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0910e-01, PNorm = 60.4096, GNorm = 2.5458, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889915\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8514e-01, PNorm = 60.4276, GNorm = 5.6164, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884908\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3808e-01, PNorm = 60.4454, GNorm = 3.2600, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893296\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6060e-01, PNorm = 60.4635, GNorm = 5.8166, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938376\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5879e-01, PNorm = 60.4820, GNorm = 1.7457, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891736\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4382e-01, PNorm = 60.5016, GNorm = 2.5296, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883996\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2453e-01, PNorm = 60.5177, GNorm = 1.6179, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895191\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3787e-01, PNorm = 60.5340, GNorm = 4.8065, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.944952\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1145e-01, PNorm = 60.5498, GNorm = 1.7221, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882615\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0352e-01, PNorm = 60.5650, GNorm = 2.7828, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904702\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9178e-01, PNorm = 60.5808, GNorm = 4.7978, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897472\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2642e-01, PNorm = 60.5951, GNorm = 4.2923, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900254\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8665e-01, PNorm = 60.6095, GNorm = 2.8636, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891942\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6549e-01, PNorm = 60.6228, GNorm = 5.4696, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874010\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8363e-01, PNorm = 60.6347, GNorm = 7.3188, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876814\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2703e-01, PNorm = 60.6468, GNorm = 3.5549, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870337\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0669e-01, PNorm = 60.6597, GNorm = 2.7948, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916905\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4816e-01, PNorm = 60.6716, GNorm = 2.0906, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926865\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2864e-01, PNorm = 60.6813, GNorm = 5.5124, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872297\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6282e-01, PNorm = 60.6898, GNorm = 2.2310, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877822\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4311e-01, PNorm = 60.6982, GNorm = 1.7897, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907275\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.1647e-01, PNorm = 60.7064, GNorm = 2.5156, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919389\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2049e-01, PNorm = 60.7145, GNorm = 1.5497, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874207\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2113e-01, PNorm = 60.7218, GNorm = 2.4985, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898396\n",
      "100%|██████████| 50/50 [00:48<00:00,  1.02it/s]\n",
      "Model 0 best validation mae = 0.865934 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.865934\n",
      "Ensemble test mae = 0.865934\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.865934\n",
      "Overall test mae = 0.865934 +/- 0.000000\n",
      "Elapsed time = 0:01:26\n",
      "1it [01:25, 85.89s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "New best spearman: 0.06510988006225447\n",
      "HYPERPARAMETER 1\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '3', '--ffn_hidden_size': '3600', '--dropout': '0.7', '--depth': '5'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 279657.55it/s]\n",
      "100%|██████████| 500/500 [00:17<00:00, 28.19it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 223006.38it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 361663.55it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 35.09it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 241872.64it/s]\n",
      "437it [00:00, 278769.71it/s]\n",
      "100%|██████████| 437/437 [00:10<00:00, 40.55it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 252293.30it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=3600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.7, inplace=False)\n",
      "    (4): Linear(in_features=3600, out_features=3600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.7, inplace=False)\n",
      "    (7): Linear(in_features=3600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 21,229,201\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.8717e+00, PNorm = 91.4735, GNorm = 54.1944, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900863\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.3264e+00, PNorm = 91.9280, GNorm = 35.8439, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 1.035619\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.0010e+00, PNorm = 92.4134, GNorm = 20.3165, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895945\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6752e+00, PNorm = 92.7200, GNorm = 24.5240, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891573\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4328e+00, PNorm = 92.9042, GNorm = 14.0541, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911774\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3119e+00, PNorm = 93.0212, GNorm = 10.5563, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904468\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1820e+00, PNorm = 93.0998, GNorm = 9.6876, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900201\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1835e+00, PNorm = 93.1571, GNorm = 11.3704, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896530\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1542e+00, PNorm = 93.2031, GNorm = 9.6256, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902002\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0056e+00, PNorm = 93.2413, GNorm = 10.4131, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891922\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0284e+00, PNorm = 93.2732, GNorm = 7.7045, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891957\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0436e+00, PNorm = 93.3018, GNorm = 6.1854, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895807\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6812e-01, PNorm = 93.3289, GNorm = 7.4213, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895456\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8459e-01, PNorm = 93.3535, GNorm = 7.5924, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897534\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0317e+00, PNorm = 93.3758, GNorm = 8.3617, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900472\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8856e-01, PNorm = 93.3971, GNorm = 6.7848, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897876\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0106e+00, PNorm = 93.4166, GNorm = 8.8442, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904279\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1675e-01, PNorm = 93.4350, GNorm = 7.4495, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897585\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4985e-01, PNorm = 93.4515, GNorm = 10.6442, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895831\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8988e-01, PNorm = 93.4662, GNorm = 7.0295, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900401\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6993e-01, PNorm = 93.4804, GNorm = 6.5128, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895037\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8137e-01, PNorm = 93.4932, GNorm = 6.9826, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896970\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9864e-01, PNorm = 93.5050, GNorm = 6.3863, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896383\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4729e-01, PNorm = 93.5160, GNorm = 5.9698, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896573\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6144e-01, PNorm = 93.5260, GNorm = 7.6734, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897779\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0513e-01, PNorm = 93.5352, GNorm = 5.3072, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895811\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2632e-01, PNorm = 93.5435, GNorm = 5.8454, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895966\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6062e-01, PNorm = 93.5510, GNorm = 6.9295, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894028\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0082e-01, PNorm = 93.5581, GNorm = 7.3206, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893685\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4474e-01, PNorm = 93.5646, GNorm = 7.2764, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895132\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4618e-01, PNorm = 93.5705, GNorm = 5.3799, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895729\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9170e-01, PNorm = 93.5763, GNorm = 5.8936, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894536\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6847e-01, PNorm = 93.5812, GNorm = 5.1998, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895119\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6066e-01, PNorm = 93.5855, GNorm = 7.1336, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894819\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2904e-01, PNorm = 93.5896, GNorm = 6.2773, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896991\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3512e-01, PNorm = 93.5932, GNorm = 6.8477, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894778\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6941e-01, PNorm = 93.5967, GNorm = 6.0010, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897730\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1865e-01, PNorm = 93.6000, GNorm = 5.4384, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895441\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0138e-01, PNorm = 93.6031, GNorm = 6.3174, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893925\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2196e-01, PNorm = 93.6059, GNorm = 4.7410, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894546\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4251e-01, PNorm = 93.6083, GNorm = 6.1165, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895905\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3566e-01, PNorm = 93.6105, GNorm = 5.7234, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895450\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2163e-01, PNorm = 93.6125, GNorm = 5.6070, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894976\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4384e-01, PNorm = 93.6144, GNorm = 5.5175, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893957\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0324e-01, PNorm = 93.6163, GNorm = 6.1569, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894731\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2428e-01, PNorm = 93.6180, GNorm = 6.0540, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894721\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1093e-01, PNorm = 93.6195, GNorm = 5.9744, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894170\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1201e-01, PNorm = 93.6209, GNorm = 6.0442, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893763\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4373e-01, PNorm = 93.6222, GNorm = 7.0109, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895093\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9811e-01, PNorm = 93.6233, GNorm = 5.5329, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894462\n",
      "100%|██████████| 50/50 [00:44<00:00,  1.13it/s]\n",
      "Model 0 best validation mae = 0.891573 on epoch 3\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.891573\n",
      "Ensemble test mae = 0.891573\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.891573\n",
      "Overall test mae = 0.891573 +/- 0.000000\n",
      "Elapsed time = 0:01:26\n",
      "2it [02:52, 86.28s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "New best spearman: 0.1252402676175033\n",
      "HYPERPARAMETER 2\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '1', '--ffn_hidden_size': '600', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 270181.91it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 32.27it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 236458.68it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 403635.95it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.08it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 112635.09it/s]\n",
      "437it [00:00, 273527.96it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 38.60it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 237177.90it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 12,199,401\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.0645e+00, PNorm = 71.8135, GNorm = 8.7540, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920045\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0772e+00, PNorm = 72.0256, GNorm = 3.1470, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.929861\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0102e+00, PNorm = 72.1918, GNorm = 3.6187, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945577\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0168e+00, PNorm = 72.2723, GNorm = 2.1197, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908999\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7127e-01, PNorm = 72.3097, GNorm = 3.1359, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924691\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0047e+00, PNorm = 72.3300, GNorm = 3.1261, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945726\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8349e-01, PNorm = 72.3473, GNorm = 4.3129, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899115\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7661e-01, PNorm = 72.3610, GNorm = 2.0149, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914344\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2142e-01, PNorm = 72.3764, GNorm = 1.3726, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900355\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3082e-01, PNorm = 72.3916, GNorm = 4.7610, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912466\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0063e-01, PNorm = 72.4081, GNorm = 1.9030, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890166\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6673e-01, PNorm = 72.4265, GNorm = 1.6890, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911512\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2949e-01, PNorm = 72.4483, GNorm = 3.9364, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915679\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3374e-01, PNorm = 72.4704, GNorm = 1.9504, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895053\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3429e-01, PNorm = 72.4911, GNorm = 2.7791, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902628\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1914e-01, PNorm = 72.5140, GNorm = 1.6966, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898534\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8799e-01, PNorm = 72.5359, GNorm = 4.8752, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887209\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6540e-01, PNorm = 72.5602, GNorm = 1.8800, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871193\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8752e-01, PNorm = 72.5836, GNorm = 5.8502, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878795\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6075e-01, PNorm = 72.6087, GNorm = 2.7187, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874869\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9976e-01, PNorm = 72.6326, GNorm = 1.8996, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875779\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3596e-01, PNorm = 72.6574, GNorm = 1.8925, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.944878\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5226e-01, PNorm = 72.6815, GNorm = 2.3805, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912426\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9756e-01, PNorm = 72.7063, GNorm = 2.3515, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904090\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9938e-01, PNorm = 72.7345, GNorm = 6.9676, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885217\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7678e-01, PNorm = 72.7607, GNorm = 1.4913, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882687\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5981e-01, PNorm = 72.7891, GNorm = 1.7630, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909977\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5564e-01, PNorm = 72.8160, GNorm = 8.2132, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.929229\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9444e-01, PNorm = 72.8414, GNorm = 6.9091, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.939540\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7737e-01, PNorm = 72.8676, GNorm = 9.8002, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.984833\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3199e-01, PNorm = 72.8933, GNorm = 1.7525, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907913\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2013e-01, PNorm = 72.9183, GNorm = 2.8511, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887579\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2967e-01, PNorm = 72.9404, GNorm = 2.8206, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900992\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0647e-01, PNorm = 72.9632, GNorm = 6.4745, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933331\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6678e-01, PNorm = 72.9859, GNorm = 2.4272, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894373\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7787e-01, PNorm = 73.0054, GNorm = 5.0326, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891831\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4857e-01, PNorm = 73.0254, GNorm = 4.8897, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887905\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5575e-01, PNorm = 73.0442, GNorm = 3.7204, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892607\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2908e-01, PNorm = 73.0635, GNorm = 2.3963, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916640\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3504e-01, PNorm = 73.0815, GNorm = 1.9784, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921574\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0325e-01, PNorm = 73.0984, GNorm = 2.8302, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911168\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9038e-01, PNorm = 73.1144, GNorm = 3.4147, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914004\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8565e-01, PNorm = 73.1307, GNorm = 1.9898, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941137\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0077e-01, PNorm = 73.1441, GNorm = 2.5250, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.948206\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9553e-01, PNorm = 73.1570, GNorm = 5.7364, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896895\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6226e-01, PNorm = 73.1697, GNorm = 4.2137, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887873\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0658e-01, PNorm = 73.1816, GNorm = 7.8905, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888394\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3936e-01, PNorm = 73.1925, GNorm = 2.6893, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.928273\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4775e-01, PNorm = 73.2048, GNorm = 4.3925, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910892\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2702e-01, PNorm = 73.2161, GNorm = 4.0667, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917062\n",
      "100%|██████████| 50/50 [01:24<00:00,  1.68s/it]\n",
      "Model 0 best validation mae = 0.871193 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.871193\n",
      "Ensemble test mae = 0.871193\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.871193\n",
      "Overall test mae = 0.871193 +/- 0.000000\n",
      "Elapsed time = 0:02:05\n",
      "3it [04:57, 104.11s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 3,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 3\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '1', '--ffn_hidden_size': '1200', '--dropout': '0.7', '--depth': '3'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 232939.24it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 31.41it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 201726.82it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 268755.26it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 31.42it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 198797.27it/s]\n",
      "437it [00:00, 167236.39it/s]\n",
      "100%|██████████| 437/437 [00:14<00:00, 31.18it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 208119.77it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 12,199,401\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.8332e+00, PNorm = 71.8074, GNorm = 8.9727, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924396\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2445e+00, PNorm = 72.0389, GNorm = 4.2907, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 1.001333\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2320e+00, PNorm = 72.2799, GNorm = 5.0227, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923380\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1124e+00, PNorm = 72.4287, GNorm = 4.7724, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912463\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0493e+00, PNorm = 72.5091, GNorm = 4.0558, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919392\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0434e+00, PNorm = 72.5572, GNorm = 4.1740, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908070\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7553e-01, PNorm = 72.5922, GNorm = 4.2783, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907929\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0105e+00, PNorm = 72.6249, GNorm = 7.0789, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894610\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5006e-01, PNorm = 72.6569, GNorm = 3.1428, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906279\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2166e-01, PNorm = 72.6921, GNorm = 6.3819, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897955\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3013e-01, PNorm = 72.7307, GNorm = 4.0915, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893551\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8171e-01, PNorm = 72.7732, GNorm = 4.8319, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917733\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3330e-01, PNorm = 72.8162, GNorm = 4.8945, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920095\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9786e-01, PNorm = 72.8597, GNorm = 4.2186, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912714\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9062e-01, PNorm = 72.8983, GNorm = 5.5268, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915071\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4208e-01, PNorm = 72.9349, GNorm = 3.4196, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909849\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4319e-01, PNorm = 72.9696, GNorm = 5.1643, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909079\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2979e-01, PNorm = 73.0015, GNorm = 3.6957, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895961\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5706e-01, PNorm = 73.0293, GNorm = 4.8085, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914564\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1094e-01, PNorm = 73.0595, GNorm = 3.1728, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904563\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2435e-01, PNorm = 73.0858, GNorm = 4.2093, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901800\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8229e-01, PNorm = 73.1126, GNorm = 3.4119, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930826\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9756e-01, PNorm = 73.1397, GNorm = 3.8332, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920872\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9013e-01, PNorm = 73.1629, GNorm = 3.8352, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920501\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2257e-01, PNorm = 73.1900, GNorm = 6.8584, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912177\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7227e-01, PNorm = 73.2129, GNorm = 5.1235, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927888\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6525e-01, PNorm = 73.2360, GNorm = 3.7114, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.955207\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1677e-01, PNorm = 73.2573, GNorm = 10.0907, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895511\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0201e-01, PNorm = 73.2754, GNorm = 6.5221, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924512\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5335e-01, PNorm = 73.2934, GNorm = 7.3498, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.953651\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8205e-01, PNorm = 73.3117, GNorm = 5.1659, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893485\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5869e-01, PNorm = 73.3286, GNorm = 3.5532, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904884\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6737e-01, PNorm = 73.3451, GNorm = 2.5892, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926738\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4386e-01, PNorm = 73.3603, GNorm = 5.8848, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933042\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0565e-01, PNorm = 73.3762, GNorm = 4.8942, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889428\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2825e-01, PNorm = 73.3905, GNorm = 4.0702, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.931296\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0752e-01, PNorm = 73.4046, GNorm = 4.0814, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927298\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0683e-01, PNorm = 73.4184, GNorm = 3.9177, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.928513\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8298e-01, PNorm = 73.4323, GNorm = 3.7865, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919286\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8573e-01, PNorm = 73.4456, GNorm = 4.8048, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.942639\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9602e-01, PNorm = 73.4585, GNorm = 4.4809, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900653\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1617e-01, PNorm = 73.4707, GNorm = 3.5688, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900698\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9530e-01, PNorm = 73.4827, GNorm = 4.9510, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926753\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8140e-01, PNorm = 73.4926, GNorm = 3.1009, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933837\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9475e-01, PNorm = 73.5020, GNorm = 4.4180, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883588\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1915e-01, PNorm = 73.5101, GNorm = 6.7492, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926706\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6000e-01, PNorm = 73.5190, GNorm = 4.9423, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890651\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7540e-01, PNorm = 73.5270, GNorm = 3.7285, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930763\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5042e-01, PNorm = 73.5350, GNorm = 5.7566, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902407\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7031e-01, PNorm = 73.5422, GNorm = 3.4631, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.937473\n",
      "100%|██████████| 50/50 [00:54<00:00,  1.08s/it]\n",
      "Model 0 best validation mae = 0.883588 on epoch 44\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.883588\n",
      "Ensemble test mae = 0.883588\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.883588\n",
      "Overall test mae = 0.883588 +/- 0.000000\n",
      "Elapsed time = 0:01:39\n",
      "4it [06:36, 102.12s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.0,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "New best spearman: 0.1277383091015159\n",
      "HYPERPARAMETER 4\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '3', '--ffn_hidden_size': '1200', '--dropout': '0.0', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 285016.58it/s]\n",
      "100%|██████████| 500/500 [00:14<00:00, 33.55it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 217051.54it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 364976.27it/s]\n",
      "100%|██████████| 437/437 [00:14<00:00, 30.18it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 224676.50it/s]\n",
      "437it [00:00, 367832.80it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 36.88it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 224428.90it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.0, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.0, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=1200, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.0, inplace=False)\n",
      "    (4): Linear(in_features=1200, out_features=1200, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.0, inplace=False)\n",
      "    (7): Linear(in_features=1200, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 16,760,401\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.5409e+00, PNorm = 89.4402, GNorm = 7.0836, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901042\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5096e-01, PNorm = 89.6914, GNorm = 0.6907, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.946597\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5453e-01, PNorm = 89.9128, GNorm = 1.7120, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889537\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5683e-01, PNorm = 90.0460, GNorm = 4.6406, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.854473\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8515e-01, PNorm = 90.1315, GNorm = 6.5797, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880802\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9760e-01, PNorm = 90.1976, GNorm = 5.6108, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.860050\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2965e-01, PNorm = 90.2644, GNorm = 3.4537, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.972165\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0463e-01, PNorm = 90.3272, GNorm = 4.6496, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.858524\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4163e-01, PNorm = 90.3880, GNorm = 2.9250, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873237\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0775e-01, PNorm = 90.4464, GNorm = 2.3123, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936456\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4186e-01, PNorm = 90.5112, GNorm = 1.8824, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885795\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7734e-01, PNorm = 90.5835, GNorm = 1.6490, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938630\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4340e-01, PNorm = 90.6576, GNorm = 2.2090, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881261\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.3680e-01, PNorm = 90.7311, GNorm = 1.4553, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908414\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.6847e-01, PNorm = 90.8043, GNorm = 1.8843, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892818\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.3182e-01, PNorm = 90.8769, GNorm = 2.1081, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913917\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.9695e-01, PNorm = 90.9508, GNorm = 2.5313, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887961\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6675e-01, PNorm = 91.0296, GNorm = 2.8097, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873777\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6720e-01, PNorm = 91.1034, GNorm = 3.9848, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.918455\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3321e-01, PNorm = 91.1758, GNorm = 4.7759, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911052\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3364e-01, PNorm = 91.2372, GNorm = 1.7999, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888236\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0774e-01, PNorm = 91.2935, GNorm = 1.6881, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.968040\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0214e-01, PNorm = 91.3427, GNorm = 2.3238, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882005\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7189e-02, PNorm = 91.3856, GNorm = 2.9908, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.950703\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3998e-02, PNorm = 91.4276, GNorm = 3.3973, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912376\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9644e-02, PNorm = 91.4667, GNorm = 1.9821, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910588\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1352e-02, PNorm = 91.5012, GNorm = 1.4563, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916503\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4085e-02, PNorm = 91.5304, GNorm = 0.9884, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912724\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9204e-02, PNorm = 91.5570, GNorm = 1.0419, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933270\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.8883e-02, PNorm = 91.5835, GNorm = 2.2006, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906391\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4082e-02, PNorm = 91.6079, GNorm = 2.6911, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914926\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.0460e-02, PNorm = 91.6323, GNorm = 1.4473, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924977\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.4933e-02, PNorm = 91.6543, GNorm = 1.3506, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926832\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.3942e-02, PNorm = 91.6749, GNorm = 1.5794, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907790\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.2690e-02, PNorm = 91.6926, GNorm = 0.8227, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921635\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.9507e-02, PNorm = 91.7094, GNorm = 0.9565, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926322\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.7425e-02, PNorm = 91.7262, GNorm = 1.0650, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914306\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.7663e-02, PNorm = 91.7412, GNorm = 0.5795, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930523\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.8108e-02, PNorm = 91.7565, GNorm = 1.7466, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924673\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.7684e-02, PNorm = 91.7706, GNorm = 1.9622, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908062\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.5753e-02, PNorm = 91.7842, GNorm = 0.7948, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926622\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4742e-02, PNorm = 91.7964, GNorm = 1.8287, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.932164\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2847e-02, PNorm = 91.8075, GNorm = 1.0621, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921360\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2263e-02, PNorm = 91.8189, GNorm = 0.9296, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913790\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1045e-02, PNorm = 91.8289, GNorm = 0.6151, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920419\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0130e-02, PNorm = 91.8385, GNorm = 1.2386, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923383\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8721e-03, PNorm = 91.8476, GNorm = 0.5615, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917720\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7959e-03, PNorm = 91.8562, GNorm = 0.4416, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915604\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4986e-03, PNorm = 91.8643, GNorm = 0.8310, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.922229\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8298e-03, PNorm = 91.8721, GNorm = 0.4220, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920172\n",
      "100%|██████████| 50/50 [01:24<00:00,  1.69s/it]\n",
      "Model 0 best validation mae = 0.854473 on epoch 3\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.854473\n",
      "Ensemble test mae = 0.854473\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.854473\n",
      "Overall test mae = 0.854473 +/- 0.000000\n",
      "Elapsed time = 0:02:07\n",
      "5it [08:43, 111.02s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 4,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 5\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '3', '--ffn_hidden_size': '3600', '--dropout': '0.3', '--depth': '4'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 297764.02it/s]\n",
      "100%|██████████| 500/500 [00:14<00:00, 34.09it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 221803.49it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 304622.05it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 37.50it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 221205.75it/s]\n",
      "437it [00:00, 368424.29it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 37.66it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 224346.49it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=3600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=3600, out_features=3600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.3, inplace=False)\n",
      "    (7): Linear(in_features=3600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 34,527,601\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.5757e+00, PNorm = 108.6079, GNorm = 5.3034, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894128\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4774e-01, PNorm = 109.0105, GNorm = 2.4200, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.949658\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7328e-01, PNorm = 109.3914, GNorm = 8.5956, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 1.025166\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5304e-01, PNorm = 109.6103, GNorm = 3.2860, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871417\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5437e-01, PNorm = 109.7343, GNorm = 2.5584, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877157\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0557e-01, PNorm = 109.8101, GNorm = 1.6117, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876917\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1775e-01, PNorm = 109.8726, GNorm = 2.0706, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919871\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6784e-01, PNorm = 109.9241, GNorm = 3.7341, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865337\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5981e-01, PNorm = 109.9701, GNorm = 1.5356, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870633\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4417e-01, PNorm = 110.0173, GNorm = 2.0974, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921737\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9554e-01, PNorm = 110.0694, GNorm = 2.1223, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879883\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2906e-01, PNorm = 110.1181, GNorm = 2.2233, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900919\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5195e-01, PNorm = 110.1726, GNorm = 3.0557, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884448\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0685e-01, PNorm = 110.2242, GNorm = 2.2705, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875129\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4966e-01, PNorm = 110.2820, GNorm = 2.1811, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880084\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2388e-01, PNorm = 110.3403, GNorm = 2.0476, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894481\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0132e-01, PNorm = 110.3987, GNorm = 4.7708, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902989\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1086e-01, PNorm = 110.4600, GNorm = 3.0939, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875056\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5195e-01, PNorm = 110.5155, GNorm = 4.5964, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889962\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3951e-01, PNorm = 110.5686, GNorm = 2.7216, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869260\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5422e-01, PNorm = 110.6190, GNorm = 3.5303, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877065\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5316e-01, PNorm = 110.6657, GNorm = 2.1659, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906824\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3894e-01, PNorm = 110.7127, GNorm = 2.2831, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891744\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1479e-01, PNorm = 110.7569, GNorm = 1.9241, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899441\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8884e-01, PNorm = 110.8000, GNorm = 3.2499, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890741\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4121e-01, PNorm = 110.8444, GNorm = 1.9631, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893190\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.5683e-01, PNorm = 110.8862, GNorm = 2.7500, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890569\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.1368e-01, PNorm = 110.9307, GNorm = 3.9276, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898551\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6477e-01, PNorm = 110.9753, GNorm = 4.0235, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916804\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6036e-01, PNorm = 111.0192, GNorm = 4.8237, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936515\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2271e-01, PNorm = 111.0613, GNorm = 2.5356, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908219\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6742e-01, PNorm = 111.1018, GNorm = 2.9108, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900603\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7226e-01, PNorm = 111.1395, GNorm = 2.2200, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906136\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0204e-01, PNorm = 111.1729, GNorm = 3.8989, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.934035\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.8076e-01, PNorm = 111.2072, GNorm = 4.2267, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883603\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7952e-01, PNorm = 111.2398, GNorm = 2.7813, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923293\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4143e-01, PNorm = 111.2711, GNorm = 2.5457, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906707\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.3744e-01, PNorm = 111.3009, GNorm = 2.3076, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908647\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5673e-01, PNorm = 111.3313, GNorm = 3.1320, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910587\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.2411e-01, PNorm = 111.3581, GNorm = 1.8404, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889394\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.1552e-01, PNorm = 111.3843, GNorm = 3.0519, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883581\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.1500e-01, PNorm = 111.4064, GNorm = 2.5309, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897577\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.9243e-01, PNorm = 111.4256, GNorm = 2.7360, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903239\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.9968e-01, PNorm = 111.4464, GNorm = 1.8860, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894443\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.1553e-01, PNorm = 111.4639, GNorm = 3.9596, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884076\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.0346e-01, PNorm = 111.4818, GNorm = 2.5870, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877849\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.9189e-01, PNorm = 111.5005, GNorm = 3.4812, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877359\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.6242e-01, PNorm = 111.5170, GNorm = 2.4163, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901514\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.8220e-01, PNorm = 111.5308, GNorm = 3.9710, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895311\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.7096e-01, PNorm = 111.5425, GNorm = 2.4192, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895625\n",
      "100%|██████████| 50/50 [01:05<00:00,  1.30s/it]\n",
      "Model 0 best validation mae = 0.865337 on epoch 7\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.865337\n",
      "Ensemble test mae = 0.865337\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.865337\n",
      "Overall test mae = 0.865337 +/- 0.000000\n",
      "Elapsed time = 0:01:45\n",
      "6it [10:28, 108.85s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 6\n",
      "{'--hidden_size': '3600', '--ffn_num_layers': '1', '--ffn_hidden_size': '3600', '--dropout': '0.7', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 271440.85it/s]\n",
      "100%|██████████| 500/500 [00:16<00:00, 29.46it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 191520.73it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 312303.77it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.30it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 226593.01it/s]\n",
      "437it [00:00, 350327.00it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 37.81it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 226425.06it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=3800, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 26,939,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7529e+00, PNorm = 87.0100, GNorm = 16.7383, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899147\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1433e+00, PNorm = 87.3605, GNorm = 3.9745, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.988013\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1550e+00, PNorm = 87.6255, GNorm = 4.3141, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901231\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1012e+00, PNorm = 87.7423, GNorm = 4.0849, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909039\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0763e+00, PNorm = 87.7895, GNorm = 4.2262, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910858\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0601e+00, PNorm = 87.8087, GNorm = 4.1656, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910654\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0783e+00, PNorm = 87.8176, GNorm = 4.2187, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906408\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0432e+00, PNorm = 87.8226, GNorm = 4.0504, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914583\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0019e+00, PNorm = 87.8269, GNorm = 2.8448, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900169\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0291e+00, PNorm = 87.8311, GNorm = 4.3139, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904694\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9080e-01, PNorm = 87.8353, GNorm = 4.8982, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921966\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5817e-01, PNorm = 87.8396, GNorm = 3.5637, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945808\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0010e+00, PNorm = 87.8442, GNorm = 4.2686, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914575\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4894e-01, PNorm = 87.8489, GNorm = 4.2050, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930186\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1951e-01, PNorm = 87.8534, GNorm = 5.8328, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917288\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3183e-01, PNorm = 87.8574, GNorm = 3.2227, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912548\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2510e-01, PNorm = 87.8607, GNorm = 4.6761, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910831\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5848e-01, PNorm = 87.8643, GNorm = 5.8177, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902713\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6890e-01, PNorm = 87.8670, GNorm = 5.3197, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911102\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8785e-01, PNorm = 87.8707, GNorm = 3.6761, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900117\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8138e-01, PNorm = 87.8736, GNorm = 3.9795, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911942\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8156e-01, PNorm = 87.8761, GNorm = 3.8327, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923964\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6238e-01, PNorm = 87.8790, GNorm = 5.7843, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902713\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9772e-01, PNorm = 87.8815, GNorm = 3.3390, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914248\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9652e-01, PNorm = 87.8842, GNorm = 6.1993, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913968\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5641e-01, PNorm = 87.8864, GNorm = 4.1331, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915669\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8082e-01, PNorm = 87.8884, GNorm = 3.6432, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916292\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6183e-01, PNorm = 87.8905, GNorm = 5.5930, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898682\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8646e-01, PNorm = 87.8924, GNorm = 7.4639, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924573\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8412e-01, PNorm = 87.8945, GNorm = 4.6071, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908675\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6458e-01, PNorm = 87.8967, GNorm = 3.2859, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905709\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5603e-01, PNorm = 87.8984, GNorm = 3.5900, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916485\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4545e-01, PNorm = 87.9002, GNorm = 3.0373, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907870\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6302e-01, PNorm = 87.9017, GNorm = 4.6883, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910378\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4864e-01, PNorm = 87.9034, GNorm = 3.7537, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905309\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4858e-01, PNorm = 87.9049, GNorm = 5.3798, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910063\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3872e-01, PNorm = 87.9066, GNorm = 4.2135, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903310\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7332e-01, PNorm = 87.9080, GNorm = 3.2062, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908877\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3459e-01, PNorm = 87.9095, GNorm = 4.0808, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921864\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2573e-01, PNorm = 87.9109, GNorm = 3.3716, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902411\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1846e-01, PNorm = 87.9122, GNorm = 3.5472, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904348\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4527e-01, PNorm = 87.9133, GNorm = 3.8714, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906470\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2097e-01, PNorm = 87.9146, GNorm = 3.7331, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899565\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0648e-01, PNorm = 87.9158, GNorm = 3.7857, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907889\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3032e-01, PNorm = 87.9170, GNorm = 3.5561, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904631\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0855e-01, PNorm = 87.9178, GNorm = 5.6229, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915756\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4218e-01, PNorm = 87.9186, GNorm = 3.7681, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890337\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0879e-01, PNorm = 87.9195, GNorm = 3.7117, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915696\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1551e-01, PNorm = 87.9205, GNorm = 7.8873, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907277\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0958e-01, PNorm = 87.9214, GNorm = 6.7240, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911378\n",
      "100%|██████████| 50/50 [02:38<00:00,  3.17s/it]\n",
      "Model 0 best validation mae = 0.890337 on epoch 46\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.890337\n",
      "Ensemble test mae = 0.890337\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.890337\n",
      "Overall test mae = 0.890337 +/- 0.000000\n",
      "Elapsed time = 0:03:22\n",
      "7it [13:50, 139.23s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 4,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 2,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 7\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '2', '--ffn_hidden_size': '3600', '--dropout': '0.3', '--depth': '4'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 304641.49it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 32.96it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 217795.41it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 361592.20it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 36.25it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 194473.30it/s]\n",
      "437it [00:00, 257070.25it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 31.56it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 206525.17it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=3600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=3600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 8,265,601\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.5561e+00, PNorm = 68.9303, GNorm = 3.8161, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890504\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7417e-01, PNorm = 69.0743, GNorm = 4.7872, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874232\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7256e-01, PNorm = 69.2168, GNorm = 8.5857, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.978740\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5811e-01, PNorm = 69.2993, GNorm = 7.0743, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880720\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4949e-01, PNorm = 69.3496, GNorm = 5.3628, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906879\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9742e-01, PNorm = 69.3840, GNorm = 4.4921, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.939920\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3768e-01, PNorm = 69.4140, GNorm = 2.6010, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.950929\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2625e-01, PNorm = 69.4371, GNorm = 5.0696, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876547\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4360e-01, PNorm = 69.4621, GNorm = 1.5485, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.868014\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9038e-01, PNorm = 69.4866, GNorm = 4.2330, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.868229\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5279e-01, PNorm = 69.5184, GNorm = 2.5708, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.864237\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0566e-01, PNorm = 69.5470, GNorm = 2.1898, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882522\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8497e-01, PNorm = 69.5791, GNorm = 2.9502, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878960\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6850e-01, PNorm = 69.6104, GNorm = 1.8188, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881394\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2278e-01, PNorm = 69.6455, GNorm = 1.8829, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877249\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4849e-01, PNorm = 69.6746, GNorm = 2.2305, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874290\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7241e-01, PNorm = 69.7065, GNorm = 5.2363, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881598\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2336e-01, PNorm = 69.7399, GNorm = 1.8069, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873606\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8363e-01, PNorm = 69.7697, GNorm = 2.5030, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879667\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2031e-01, PNorm = 69.7973, GNorm = 1.9060, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887420\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9337e-01, PNorm = 69.8264, GNorm = 2.2242, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902617\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7797e-01, PNorm = 69.8559, GNorm = 2.3009, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909093\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9694e-01, PNorm = 69.8857, GNorm = 2.5783, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899378\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7144e-01, PNorm = 69.9188, GNorm = 1.8240, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916805\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7686e-01, PNorm = 69.9537, GNorm = 4.3709, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886900\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6328e-01, PNorm = 69.9818, GNorm = 2.4085, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889536\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0925e-01, PNorm = 70.0149, GNorm = 2.4449, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908852\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2418e-01, PNorm = 70.0453, GNorm = 3.9451, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907521\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0147e-01, PNorm = 70.0757, GNorm = 2.6060, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912426\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1997e-01, PNorm = 70.1041, GNorm = 4.8483, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927362\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0063e-01, PNorm = 70.1335, GNorm = 1.8834, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898598\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0301e-01, PNorm = 70.1634, GNorm = 2.3806, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886614\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6880e-01, PNorm = 70.1929, GNorm = 2.6738, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885170\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8554e-01, PNorm = 70.2189, GNorm = 4.4758, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916277\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.5136e-01, PNorm = 70.2427, GNorm = 2.4041, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876602\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6490e-01, PNorm = 70.2667, GNorm = 2.1196, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901060\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3041e-01, PNorm = 70.2896, GNorm = 3.7398, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883647\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2630e-01, PNorm = 70.3114, GNorm = 2.0541, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892107\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4007e-01, PNorm = 70.3335, GNorm = 2.3162, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885043\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3559e-01, PNorm = 70.3510, GNorm = 3.0089, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874303\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4698e-01, PNorm = 70.3699, GNorm = 2.3197, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872149\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4991e-01, PNorm = 70.3862, GNorm = 3.1138, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870632\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3746e-01, PNorm = 70.4034, GNorm = 2.1142, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888327\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0527e-01, PNorm = 70.4197, GNorm = 1.7816, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899958\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.1113e-01, PNorm = 70.4335, GNorm = 3.2514, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874927\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9176e-01, PNorm = 70.4479, GNorm = 1.5903, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874663\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.1331e-01, PNorm = 70.4608, GNorm = 1.8032, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880716\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7839e-01, PNorm = 70.4755, GNorm = 2.2367, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903594\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7662e-01, PNorm = 70.4893, GNorm = 2.4480, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887337\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6038e-01, PNorm = 70.5023, GNorm = 1.8267, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902354\n",
      "100%|██████████| 50/50 [00:44<00:00,  1.13it/s]\n",
      "Model 0 best validation mae = 0.864237 on epoch 10\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.864237\n",
      "Ensemble test mae = 0.864237\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.864237\n",
      "Overall test mae = 0.864237 +/- 0.000000\n",
      "Elapsed time = 0:01:26\n",
      "8it [15:16, 122.36s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 3,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.5,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 8\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '3', '--ffn_hidden_size': '1200', '--dropout': '0.5', '--depth': '3'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 253156.93it/s]\n",
      "100%|██████████| 500/500 [00:14<00:00, 34.48it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 216580.81it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 354185.67it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 37.66it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 222656.81it/s]\n",
      "437it [00:00, 359535.28it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 37.89it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 225200.99it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.5, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.5, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=1200, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.5, inplace=False)\n",
      "    (4): Linear(in_features=1200, out_features=1200, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.5, inplace=False)\n",
      "    (7): Linear(in_features=1200, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 16,760,401\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4051e+00, PNorm = 89.4549, GNorm = 21.8463, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904108\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2619e+00, PNorm = 89.7881, GNorm = 7.5783, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901337\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0729e+00, PNorm = 90.1338, GNorm = 8.7831, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.977101\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0395e+00, PNorm = 90.3349, GNorm = 4.5988, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907728\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8670e-01, PNorm = 90.4491, GNorm = 5.2979, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938156\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8009e-01, PNorm = 90.5184, GNorm = 3.5099, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930674\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9277e-01, PNorm = 90.5683, GNorm = 2.9520, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907195\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6209e-01, PNorm = 90.6084, GNorm = 6.1464, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873620\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8234e-01, PNorm = 90.6414, GNorm = 3.1746, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890051\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6239e-01, PNorm = 90.6741, GNorm = 3.9169, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876486\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9791e-01, PNorm = 90.7079, GNorm = 3.2399, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869377\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4463e-01, PNorm = 90.7470, GNorm = 3.0907, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897831\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1915e-01, PNorm = 90.7887, GNorm = 4.1727, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895099\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6106e-01, PNorm = 90.8309, GNorm = 3.8595, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903765\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4588e-01, PNorm = 90.8709, GNorm = 3.5057, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908083\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5231e-01, PNorm = 90.9129, GNorm = 2.4420, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881499\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2346e-01, PNorm = 90.9524, GNorm = 5.0658, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879341\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0678e-01, PNorm = 90.9933, GNorm = 2.9809, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871980\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5489e-01, PNorm = 91.0301, GNorm = 3.6024, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903135\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8937e-01, PNorm = 91.0652, GNorm = 2.7643, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901859\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8954e-01, PNorm = 91.0936, GNorm = 2.7503, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892432\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6329e-01, PNorm = 91.1220, GNorm = 2.7263, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914916\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4703e-01, PNorm = 91.1536, GNorm = 2.5645, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906586\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3810e-01, PNorm = 91.1830, GNorm = 3.2263, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913227\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1540e-01, PNorm = 91.2153, GNorm = 3.9956, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896001\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9510e-01, PNorm = 91.2428, GNorm = 2.9952, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895223\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1904e-01, PNorm = 91.2715, GNorm = 3.3218, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916157\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9392e-01, PNorm = 91.2989, GNorm = 4.6666, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896215\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4809e-01, PNorm = 91.3266, GNorm = 4.1251, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907387\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2019e-01, PNorm = 91.3546, GNorm = 5.6131, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941315\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0416e-01, PNorm = 91.3822, GNorm = 2.9702, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891207\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6171e-01, PNorm = 91.4074, GNorm = 2.7638, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879078\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9334e-01, PNorm = 91.4312, GNorm = 2.3511, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893869\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4410e-01, PNorm = 91.4533, GNorm = 5.2827, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923355\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7034e-01, PNorm = 91.4747, GNorm = 2.7345, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873989\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3725e-01, PNorm = 91.4942, GNorm = 2.7484, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898036\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5451e-01, PNorm = 91.5160, GNorm = 2.8271, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887821\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5123e-01, PNorm = 91.5372, GNorm = 2.8969, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888698\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6588e-01, PNorm = 91.5597, GNorm = 3.4458, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895859\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1638e-01, PNorm = 91.5805, GNorm = 2.7430, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905264\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8523e-01, PNorm = 91.6002, GNorm = 3.0665, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891779\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2529e-01, PNorm = 91.6181, GNorm = 3.0191, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885859\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9456e-01, PNorm = 91.6357, GNorm = 2.9421, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885250\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8789e-01, PNorm = 91.6525, GNorm = 2.2881, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887679\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1561e-01, PNorm = 91.6667, GNorm = 4.7440, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871679\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9338e-01, PNorm = 91.6799, GNorm = 4.4003, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900912\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9746e-01, PNorm = 91.6933, GNorm = 2.7364, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893154\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9476e-01, PNorm = 91.7059, GNorm = 2.7174, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907872\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7818e-01, PNorm = 91.7178, GNorm = 3.9826, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887785\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7906e-01, PNorm = 91.7287, GNorm = 2.4178, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905914\n",
      "100%|██████████| 50/50 [00:50<00:00,  1.01s/it]\n",
      "Model 0 best validation mae = 0.869377 on epoch 10\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.869377\n",
      "Ensemble test mae = 0.869377\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.869377\n",
      "Overall test mae = 0.869377 +/- 0.000000\n",
      "Elapsed time = 0:01:29\n",
      "9it [16:45, 112.09s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 9\n",
      "{'--hidden_size': '3600', '--ffn_num_layers': '1', '--ffn_hidden_size': '600', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 251095.79it/s]\n",
      "100%|██████████| 500/500 [00:16<00:00, 30.46it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 108959.94it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 136580.54it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.45it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 222792.13it/s]\n",
      "437it [00:00, 338988.51it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 36.97it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 236078.16it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=3800, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 26,939,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.3958e+00, PNorm = 87.0283, GNorm = 5.0413, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910734\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0953e+00, PNorm = 87.3805, GNorm = 1.7195, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924802\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0251e+00, PNorm = 87.6550, GNorm = 2.3342, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915488\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9544e-01, PNorm = 87.7838, GNorm = 1.7993, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897034\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7368e-01, PNorm = 87.8428, GNorm = 2.5804, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908919\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2662e-01, PNorm = 87.8768, GNorm = 1.8910, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907568\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8570e-01, PNorm = 87.9045, GNorm = 3.5002, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.946017\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8713e-01, PNorm = 87.9327, GNorm = 4.1098, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888096\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2428e-01, PNorm = 87.9642, GNorm = 2.1240, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899320\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2591e-01, PNorm = 87.9878, GNorm = 3.4966, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894433\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1647e-01, PNorm = 88.0201, GNorm = 2.1341, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874971\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0956e-01, PNorm = 88.0475, GNorm = 2.1235, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903949\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8750e-01, PNorm = 88.0792, GNorm = 3.4486, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894593\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7581e-01, PNorm = 88.1126, GNorm = 2.8559, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898567\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6110e-01, PNorm = 88.1455, GNorm = 2.9689, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885508\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5854e-01, PNorm = 88.1853, GNorm = 1.8350, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870181\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3579e-01, PNorm = 88.2266, GNorm = 6.4367, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874113\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9201e-01, PNorm = 88.2712, GNorm = 2.1436, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.864902\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4050e-01, PNorm = 88.3152, GNorm = 6.8904, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881273\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6266e-01, PNorm = 88.3600, GNorm = 4.6812, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865718\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1357e-01, PNorm = 88.4038, GNorm = 2.7877, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870166\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3891e-01, PNorm = 88.4462, GNorm = 1.4940, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902744\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0786e-01, PNorm = 88.4910, GNorm = 2.8062, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887044\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2149e-01, PNorm = 88.5359, GNorm = 1.3251, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886737\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7802e-01, PNorm = 88.5831, GNorm = 4.0902, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879767\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6316e-01, PNorm = 88.6271, GNorm = 1.8550, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908849\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4363e-01, PNorm = 88.6676, GNorm = 2.0665, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936274\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1524e-01, PNorm = 88.7069, GNorm = 3.0901, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897046\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1733e-01, PNorm = 88.7486, GNorm = 6.4282, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891882\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8937e-01, PNorm = 88.7856, GNorm = 3.7440, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878039\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8435e-01, PNorm = 88.8243, GNorm = 4.6199, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876126\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7414e-01, PNorm = 88.8608, GNorm = 4.1629, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909948\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3580e-01, PNorm = 88.8973, GNorm = 2.4499, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927757\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6112e-01, PNorm = 88.9283, GNorm = 8.7047, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880485\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0192e-01, PNorm = 88.9597, GNorm = 5.4334, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.864227\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7512e-01, PNorm = 88.9871, GNorm = 5.4879, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870929\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2826e-01, PNorm = 89.0163, GNorm = 1.8891, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871800\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3573e-01, PNorm = 89.0424, GNorm = 2.1590, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869452\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.8433e-01, PNorm = 89.0674, GNorm = 3.5853, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899381\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9051e-01, PNorm = 89.0907, GNorm = 2.6863, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905364\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5496e-01, PNorm = 89.1125, GNorm = 2.1538, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882668\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4762e-01, PNorm = 89.1331, GNorm = 2.4457, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889389\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4641e-01, PNorm = 89.1543, GNorm = 2.2578, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941612\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5795e-01, PNorm = 89.1743, GNorm = 3.8474, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924628\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.3326e-01, PNorm = 89.1928, GNorm = 2.3647, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881559\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.1403e-01, PNorm = 89.2106, GNorm = 3.0233, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.864168\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.2657e-01, PNorm = 89.2267, GNorm = 5.7850, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.866967\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.2334e-01, PNorm = 89.2412, GNorm = 2.2487, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898704\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.0872e-01, PNorm = 89.2557, GNorm = 1.9716, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870904\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.8135e-01, PNorm = 89.2702, GNorm = 5.6937, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874385\n",
      "100%|██████████| 50/50 [02:42<00:00,  3.25s/it]\n",
      "Model 0 best validation mae = 0.864168 on epoch 45\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.864168\n",
      "Ensemble test mae = 0.864168\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.864168\n",
      "Overall test mae = 0.864168 +/- 0.000000\n",
      "Elapsed time = 0:03:25\n",
      "10it [20:11, 140.88s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "New best spearman: 0.19161837152622288\n",
      "HYPERPARAMETER 10\n",
      "{'--hidden_size': '600', '--ffn_num_layers': '3', '--ffn_hidden_size': '1200', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 307951.84it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 33.17it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 221055.34it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 356181.66it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.71it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 129864.73it/s]\n",
      "437it [00:00, 163960.18it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 35.73it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 223744.00it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=600, bias=False)\n",
      "        (W_h): Linear(in_features=600, out_features=600, bias=False)\n",
      "        (W_o): Linear(in_features=733, out_features=600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=800, out_features=1200, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=1200, out_features=1200, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.3, inplace=False)\n",
      "    (7): Linear(in_features=1200, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 3,292,801\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1893e+00, PNorm = 60.5598, GNorm = 11.9535, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893674\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0447e+00, PNorm = 60.6494, GNorm = 3.2471, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.944981\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0705e-01, PNorm = 60.7629, GNorm = 4.5329, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886980\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4997e-01, PNorm = 60.8424, GNorm = 3.1895, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874399\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6800e-01, PNorm = 60.8972, GNorm = 4.8122, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890834\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7874e-01, PNorm = 60.9374, GNorm = 3.6568, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876538\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8435e-01, PNorm = 60.9704, GNorm = 1.9181, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885152\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0284e-01, PNorm = 61.0011, GNorm = 3.4564, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.868489\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2521e-01, PNorm = 61.0291, GNorm = 1.8346, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.860686\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6104e-01, PNorm = 61.0527, GNorm = 3.6910, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865165\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1101e-01, PNorm = 61.0777, GNorm = 2.1533, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870419\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9221e-01, PNorm = 61.1028, GNorm = 3.9848, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884741\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4751e-01, PNorm = 61.1271, GNorm = 3.5528, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893855\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1195e-01, PNorm = 61.1473, GNorm = 2.2330, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893470\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3556e-01, PNorm = 61.1695, GNorm = 2.3020, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879953\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4490e-01, PNorm = 61.1933, GNorm = 3.1703, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876631\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9919e-01, PNorm = 61.2126, GNorm = 4.7929, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873758\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6116e-01, PNorm = 61.2345, GNorm = 2.8496, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.859082\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7653e-01, PNorm = 61.2546, GNorm = 3.6360, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875730\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2015e-01, PNorm = 61.2715, GNorm = 3.5739, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.867628\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4379e-01, PNorm = 61.2879, GNorm = 3.0567, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871096\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4124e-01, PNorm = 61.3037, GNorm = 2.0913, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890072\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9882e-01, PNorm = 61.3196, GNorm = 2.9952, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880731\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9626e-01, PNorm = 61.3336, GNorm = 2.1745, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893669\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6076e-01, PNorm = 61.3491, GNorm = 5.1558, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880039\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8472e-01, PNorm = 61.3611, GNorm = 3.3716, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875049\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1768e-01, PNorm = 61.3745, GNorm = 2.3193, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887255\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4079e-01, PNorm = 61.3880, GNorm = 4.8811, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887961\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6214e-01, PNorm = 61.3997, GNorm = 4.2337, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899157\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4620e-01, PNorm = 61.4112, GNorm = 6.1365, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914294\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5202e-01, PNorm = 61.4223, GNorm = 2.5285, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894517\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2504e-01, PNorm = 61.4342, GNorm = 2.9664, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880245\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2637e-01, PNorm = 61.4443, GNorm = 2.3086, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880217\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1891e-01, PNorm = 61.4550, GNorm = 5.2170, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900836\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8264e-01, PNorm = 61.4652, GNorm = 2.5118, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.867481\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2558e-01, PNorm = 61.4730, GNorm = 3.0052, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876639\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8562e-01, PNorm = 61.4814, GNorm = 2.6082, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882879\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7484e-01, PNorm = 61.4903, GNorm = 2.5798, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896957\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1319e-01, PNorm = 61.4983, GNorm = 3.7040, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887055\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2341e-01, PNorm = 61.5040, GNorm = 2.9002, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897001\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8412e-01, PNorm = 61.5116, GNorm = 3.6865, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870800\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8918e-01, PNorm = 61.5187, GNorm = 2.2395, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872350\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8081e-01, PNorm = 61.5268, GNorm = 2.8574, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881521\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3161e-01, PNorm = 61.5338, GNorm = 2.4167, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908473\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4784e-01, PNorm = 61.5396, GNorm = 4.4430, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871839\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8392e-01, PNorm = 61.5441, GNorm = 2.9822, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883195\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7347e-01, PNorm = 61.5494, GNorm = 2.4857, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880303\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6539e-01, PNorm = 61.5542, GNorm = 2.9657, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890906\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2069e-01, PNorm = 61.5587, GNorm = 4.5065, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882625\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2969e-01, PNorm = 61.5633, GNorm = 2.7553, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889334\n",
      "100%|██████████| 50/50 [00:39<00:00,  1.27it/s]\n",
      "Model 0 best validation mae = 0.859082 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.859082\n",
      "Ensemble test mae = 0.859082\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.859082\n",
      "Overall test mae = 0.859082 +/- 0.000000\n",
      "Elapsed time = 0:01:20\n",
      "11it [21:31, 122.33s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 11\n",
      "{'--hidden_size': '600', '--ffn_num_layers': '3', '--ffn_hidden_size': '600', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 169507.92it/s]\n",
      "100%|██████████| 500/500 [00:16<00:00, 30.64it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 193839.73it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 321845.63it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.06it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 210800.56it/s]\n",
      "437it [00:00, 345311.01it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.61it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 211628.09it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=600, bias=False)\n",
      "        (W_h): Linear(in_features=600, out_features=600, bias=False)\n",
      "        (W_o): Linear(in_features=733, out_features=600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=800, out_features=600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=600, out_features=600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.3, inplace=False)\n",
      "    (7): Linear(in_features=600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 1,731,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1683e+00, PNorm = 52.7506, GNorm = 4.6343, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892563\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8718e-01, PNorm = 52.8039, GNorm = 3.2665, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913948\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9486e-01, PNorm = 52.8725, GNorm = 5.4083, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889785\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5079e-01, PNorm = 52.9227, GNorm = 2.8762, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.864924\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9101e-01, PNorm = 52.9612, GNorm = 3.5287, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890410\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9165e-01, PNorm = 52.9871, GNorm = 3.2825, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.861814\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6315e-01, PNorm = 53.0080, GNorm = 2.0504, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894224\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1495e-01, PNorm = 53.0273, GNorm = 4.7413, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870081\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5410e-01, PNorm = 53.0447, GNorm = 2.0956, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865579\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9371e-01, PNorm = 53.0593, GNorm = 3.9497, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.867655\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4980e-01, PNorm = 53.0762, GNorm = 2.3935, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869529\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5793e-01, PNorm = 53.0916, GNorm = 2.6782, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872828\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5740e-01, PNorm = 53.1105, GNorm = 3.0337, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880396\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5441e-01, PNorm = 53.1258, GNorm = 3.2598, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877582\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6577e-01, PNorm = 53.1396, GNorm = 3.2448, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891863\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3195e-01, PNorm = 53.1567, GNorm = 2.1254, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895134\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2902e-01, PNorm = 53.1702, GNorm = 3.1036, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876182\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1766e-01, PNorm = 53.1849, GNorm = 2.6472, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.873149\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6392e-01, PNorm = 53.1999, GNorm = 2.4174, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896773\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5481e-01, PNorm = 53.2121, GNorm = 2.8297, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875216\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0150e-01, PNorm = 53.2232, GNorm = 2.6907, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874892\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6690e-01, PNorm = 53.2340, GNorm = 2.2515, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904115\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1418e-01, PNorm = 53.2462, GNorm = 2.2441, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882373\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5906e-01, PNorm = 53.2560, GNorm = 2.2920, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894469\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2410e-01, PNorm = 53.2671, GNorm = 3.5111, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887481\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9050e-01, PNorm = 53.2768, GNorm = 2.7002, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888099\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5486e-01, PNorm = 53.2874, GNorm = 2.1914, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896146\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7882e-01, PNorm = 53.2987, GNorm = 4.5667, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881369\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0035e-01, PNorm = 53.3092, GNorm = 2.9127, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888665\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9817e-01, PNorm = 53.3190, GNorm = 5.8093, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.934984\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9842e-01, PNorm = 53.3281, GNorm = 2.1033, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901986\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9555e-01, PNorm = 53.3385, GNorm = 3.5392, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882526\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8216e-01, PNorm = 53.3470, GNorm = 2.0236, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902061\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8999e-01, PNorm = 53.3556, GNorm = 4.8612, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909207\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6905e-01, PNorm = 53.3641, GNorm = 3.0071, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875497\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7694e-01, PNorm = 53.3719, GNorm = 2.6943, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890744\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5190e-01, PNorm = 53.3794, GNorm = 2.4438, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895354\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5021e-01, PNorm = 53.3868, GNorm = 2.0690, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917584\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7798e-01, PNorm = 53.3952, GNorm = 2.7395, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903352\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5155e-01, PNorm = 53.4014, GNorm = 2.1925, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892875\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4484e-01, PNorm = 53.4081, GNorm = 2.9534, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875969\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5426e-01, PNorm = 53.4139, GNorm = 2.2209, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886540\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2973e-01, PNorm = 53.4202, GNorm = 2.7822, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894623\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9113e-01, PNorm = 53.4261, GNorm = 2.3462, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905926\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1991e-01, PNorm = 53.4315, GNorm = 3.6858, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876381\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5914e-01, PNorm = 53.4360, GNorm = 3.8123, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910136\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2140e-01, PNorm = 53.4412, GNorm = 3.0548, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892692\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0645e-01, PNorm = 53.4455, GNorm = 2.2740, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902008\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8872e-01, PNorm = 53.4495, GNorm = 3.2133, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883222\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8919e-01, PNorm = 53.4533, GNorm = 3.0319, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901820\n",
      "100%|██████████| 50/50 [00:39<00:00,  1.27it/s]\n",
      "Model 0 best validation mae = 0.861814 on epoch 5\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.861814\n",
      "Ensemble test mae = 0.861814\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.861814\n",
      "Overall test mae = 0.861814 +/- 0.000000\n",
      "Elapsed time = 0:01:22\n",
      "12it [22:53, 110.21s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.0,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 2400,\n",
      " 'ffn_num_layers': 2,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 12\n",
      "{'--hidden_size': '3600', '--ffn_num_layers': '2', '--ffn_hidden_size': '2400', '--dropout': '0.0', '--depth': '5'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 258939.62it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 32.86it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 211769.36it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 331808.63it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.41it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 198646.46it/s]\n",
      "437it [00:00, 253409.49it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 32.18it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 203679.39it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.0, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.0, inplace=False)\n",
      "    (1): Linear(in_features=3800, out_features=2400, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.0, inplace=False)\n",
      "    (4): Linear(in_features=2400, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 36,060,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.6881e+00, PNorm = 102.6094, GNorm = 1.6674, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.934338\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5305e-01, PNorm = 103.0941, GNorm = 1.2077, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886827\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1803e-01, PNorm = 103.4889, GNorm = 7.4365, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936835\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0749e-01, PNorm = 103.6810, GNorm = 3.2790, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.865975\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3603e-01, PNorm = 103.7785, GNorm = 2.5661, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881636\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5361e-01, PNorm = 103.8359, GNorm = 0.8255, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872594\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7935e-01, PNorm = 103.8852, GNorm = 1.8039, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903693\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6164e-01, PNorm = 103.9306, GNorm = 3.0166, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874558\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2353e-01, PNorm = 103.9794, GNorm = 1.5368, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869537\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0641e-01, PNorm = 104.0290, GNorm = 2.4630, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903863\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7117e-01, PNorm = 104.0884, GNorm = 0.9749, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894809\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3675e-01, PNorm = 104.1552, GNorm = 1.0524, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.931138\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4333e-01, PNorm = 104.2259, GNorm = 3.8635, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899084\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1445e-01, PNorm = 104.3017, GNorm = 0.8461, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887256\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8283e-01, PNorm = 104.3809, GNorm = 0.9172, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887525\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7706e-01, PNorm = 104.4633, GNorm = 3.3673, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879575\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.5604e-01, PNorm = 104.5526, GNorm = 4.3266, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887715\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0706e-01, PNorm = 104.6460, GNorm = 1.1904, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880127\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0251e-01, PNorm = 104.7442, GNorm = 2.2718, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912715\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6380e-01, PNorm = 104.8543, GNorm = 2.4232, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897254\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5990e-01, PNorm = 104.9672, GNorm = 1.4883, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938405\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.3809e-01, PNorm = 105.0741, GNorm = 0.8333, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.940915\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.2587e-01, PNorm = 105.1779, GNorm = 2.2535, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919045\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.9450e-01, PNorm = 105.2885, GNorm = 1.2439, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907520\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.6950e-01, PNorm = 105.4002, GNorm = 1.2948, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901658\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.5967e-01, PNorm = 105.5184, GNorm = 1.6362, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916033\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.4384e-01, PNorm = 105.6266, GNorm = 1.1699, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915920\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.2550e-01, PNorm = 105.7323, GNorm = 1.4474, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926219\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.2019e-01, PNorm = 105.8435, GNorm = 1.4382, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901843\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.0896e-01, PNorm = 105.9449, GNorm = 3.0082, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915685\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.0292e-01, PNorm = 106.0418, GNorm = 4.5285, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901621\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.8425e-01, PNorm = 106.1319, GNorm = 0.9729, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927424\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.7177e-01, PNorm = 106.2232, GNorm = 1.7628, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945817\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.8436e-01, PNorm = 106.3045, GNorm = 5.0367, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920600\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6754e-01, PNorm = 106.3805, GNorm = 1.9077, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893351\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6369e-01, PNorm = 106.4528, GNorm = 2.3867, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907105\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4291e-01, PNorm = 106.5246, GNorm = 1.3107, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.928588\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2949e-01, PNorm = 106.5881, GNorm = 0.7227, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920646\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1622e-01, PNorm = 106.6526, GNorm = 0.9319, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.934705\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1802e-01, PNorm = 106.7084, GNorm = 2.8674, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920322\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1087e-01, PNorm = 106.7645, GNorm = 1.5123, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.932330\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1138e-01, PNorm = 106.8140, GNorm = 0.7226, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945708\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0245e-01, PNorm = 106.8556, GNorm = 0.9717, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.947569\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8354e-02, PNorm = 106.9018, GNorm = 1.5672, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.960809\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1366e-02, PNorm = 106.9411, GNorm = 1.1960, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.950191\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2380e-02, PNorm = 106.9796, GNorm = 1.4690, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945932\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8489e-02, PNorm = 107.0145, GNorm = 0.8684, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941750\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1617e-02, PNorm = 107.0494, GNorm = 1.2144, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.953456\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1592e-02, PNorm = 107.0822, GNorm = 2.3688, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.952457\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8928e-02, PNorm = 107.1144, GNorm = 0.7966, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.950367\n",
      "100%|██████████| 50/50 [02:17<00:00,  2.75s/it]\n",
      "Model 0 best validation mae = 0.865975 on epoch 3\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.865975\n",
      "Ensemble test mae = 0.865975\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.865975\n",
      "Overall test mae = 0.865975 +/- 0.000000\n",
      "Elapsed time = 0:03:01\n",
      "13it [25:54, 131.67s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 3,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.0,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 2,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 13\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '2', '--ffn_hidden_size': '3600', '--dropout': '0.0', '--depth': '3'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 227038.22it/s]\n",
      "100%|██████████| 500/500 [00:17<00:00, 27.95it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 172989.52it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 296299.85it/s]\n",
      "100%|██████████| 437/437 [00:14<00:00, 29.69it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 215763.49it/s]\n",
      "437it [00:00, 3489.66it/s]\n",
      "100%|██████████| 437/437 [00:14<00:00, 31.16it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 207155.39it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.0, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.0, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=3600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.0, inplace=False)\n",
      "    (4): Linear(in_features=3600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 8,265,601\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4897e+00, PNorm = 68.9305, GNorm = 5.1386, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885587\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0014e-01, PNorm = 69.0936, GNorm = 3.1746, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884380\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8897e-01, PNorm = 69.2603, GNorm = 7.9075, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.990034\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6900e-01, PNorm = 69.3653, GNorm = 6.5084, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897452\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6490e-01, PNorm = 69.4369, GNorm = 3.0214, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890776\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5819e-01, PNorm = 69.4940, GNorm = 0.9163, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871825\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6819e-01, PNorm = 69.5544, GNorm = 1.0006, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901237\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3573e-01, PNorm = 69.6096, GNorm = 5.4969, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877368\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1092e-01, PNorm = 69.6558, GNorm = 1.8693, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881747\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8482e-01, PNorm = 69.7052, GNorm = 2.9175, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915719\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2815e-01, PNorm = 69.7602, GNorm = 1.5260, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911755\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.7863e-01, PNorm = 69.8154, GNorm = 1.0701, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919879\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5476e-01, PNorm = 69.8731, GNorm = 2.5740, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888636\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.4571e-01, PNorm = 69.9400, GNorm = 2.1489, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885613\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.9747e-01, PNorm = 70.0106, GNorm = 0.9174, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900613\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.7668e-01, PNorm = 70.0843, GNorm = 1.4667, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902272\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.5154e-01, PNorm = 70.1581, GNorm = 1.2979, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904487\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.4231e-01, PNorm = 70.2400, GNorm = 1.1072, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871510\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.6389e-01, PNorm = 70.2977, GNorm = 2.3572, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911500\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.1444e-01, PNorm = 70.3660, GNorm = 1.7202, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904195\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.9983e-01, PNorm = 70.4270, GNorm = 2.2032, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933418\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.7980e-01, PNorm = 70.4887, GNorm = 0.8973, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914532\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.6492e-01, PNorm = 70.5503, GNorm = 2.5556, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902244\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4793e-01, PNorm = 70.6091, GNorm = 2.4166, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900642\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3704e-01, PNorm = 70.6631, GNorm = 1.2574, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905168\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2567e-01, PNorm = 70.7167, GNorm = 0.9941, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901704\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1644e-01, PNorm = 70.7690, GNorm = 1.6137, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895397\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0742e-01, PNorm = 70.8211, GNorm = 0.6787, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914219\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0243e-01, PNorm = 70.8678, GNorm = 0.9035, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901222\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8863e-02, PNorm = 70.9152, GNorm = 2.6677, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901602\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6976e-02, PNorm = 70.9564, GNorm = 3.6197, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888351\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2017e-02, PNorm = 70.9920, GNorm = 1.0749, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917312\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1990e-02, PNorm = 71.0288, GNorm = 2.0754, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.925804\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1439e-02, PNorm = 71.0597, GNorm = 1.5611, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897794\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9873e-02, PNorm = 71.0887, GNorm = 2.4447, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886916\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2336e-02, PNorm = 71.1157, GNorm = 1.6612, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.918177\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5540e-02, PNorm = 71.1412, GNorm = 0.6544, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913189\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4729e-02, PNorm = 71.1669, GNorm = 0.6424, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908386\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2660e-02, PNorm = 71.1919, GNorm = 0.7174, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919347\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0201e-02, PNorm = 71.2164, GNorm = 1.1644, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902624\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6845e-02, PNorm = 71.2372, GNorm = 0.7686, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911430\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7630e-02, PNorm = 71.2578, GNorm = 0.5528, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915840\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4535e-02, PNorm = 71.2751, GNorm = 0.6755, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923286\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2784e-02, PNorm = 71.2945, GNorm = 0.9468, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.925858\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9382e-02, PNorm = 71.3108, GNorm = 0.6540, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917798\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6457e-02, PNorm = 71.3277, GNorm = 0.9392, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909911\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4244e-02, PNorm = 71.3421, GNorm = 0.8793, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909516\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2930e-02, PNorm = 71.3567, GNorm = 0.8922, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912718\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4218e-02, PNorm = 71.3716, GNorm = 2.0867, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920086\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2486e-02, PNorm = 71.3848, GNorm = 0.8799, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914621\n",
      "100%|██████████| 50/50 [00:42<00:00,  1.17it/s]\n",
      "Model 0 best validation mae = 0.871510 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.871510\n",
      "Ensemble test mae = 0.871510\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.871510\n",
      "Overall test mae = 0.871510 +/- 0.000000\n",
      "Elapsed time = 0:01:30\n",
      "14it [27:25, 119.27s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 4,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.5,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 3600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 14\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '1', '--ffn_hidden_size': '3600', '--dropout': '0.5', '--depth': '4'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "500it [00:00, 182615.12it/s]\n",
      "100%|██████████| 500/500 [00:17<00:00, 29.06it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 111219.35it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 291818.32it/s]\n",
      "100%|██████████| 437/437 [00:15<00:00, 28.29it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 125593.45it/s]\n",
      "437it [00:00, 211481.58it/s]\n",
      "100%|██████████| 437/437 [00:15<00:00, 28.44it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 208380.04it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.5, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.5, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 3,219,801\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4817e+00, PNorm = 52.2687, GNorm = 4.6665, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.932443\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1682e+00, PNorm = 52.3394, GNorm = 3.4978, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.981793\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.2183e+00, PNorm = 52.4203, GNorm = 4.0065, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907704\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0565e+00, PNorm = 52.4727, GNorm = 3.7259, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912698\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0766e+00, PNorm = 52.5032, GNorm = 3.0710, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908242\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6221e-01, PNorm = 52.5224, GNorm = 2.1110, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916375\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4638e-01, PNorm = 52.5390, GNorm = 4.4000, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904877\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7719e-01, PNorm = 52.5575, GNorm = 6.1098, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895354\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0027e+00, PNorm = 52.5751, GNorm = 4.0414, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912792\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.1684e-01, PNorm = 52.5972, GNorm = 6.0265, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891976\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2616e-01, PNorm = 52.6193, GNorm = 2.5765, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895431\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6192e-01, PNorm = 52.6435, GNorm = 2.4513, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920004\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7837e-01, PNorm = 52.6675, GNorm = 4.3684, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916621\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7496e-01, PNorm = 52.6936, GNorm = 3.5183, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914543\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4696e-01, PNorm = 52.7130, GNorm = 2.7420, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899696\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3806e-01, PNorm = 52.7366, GNorm = 2.2443, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901627\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9608e-01, PNorm = 52.7586, GNorm = 3.0661, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907847\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7851e-01, PNorm = 52.7806, GNorm = 2.2557, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887603\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5328e-01, PNorm = 52.8036, GNorm = 6.2681, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900941\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9507e-01, PNorm = 52.8249, GNorm = 2.7174, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889302\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8555e-01, PNorm = 52.8465, GNorm = 2.1608, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892193\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6280e-01, PNorm = 52.8690, GNorm = 3.0535, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.948205\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6676e-01, PNorm = 52.8891, GNorm = 2.3630, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930276\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6934e-01, PNorm = 52.9090, GNorm = 3.3422, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.918404\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4065e-01, PNorm = 52.9315, GNorm = 6.4615, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913062\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6099e-01, PNorm = 52.9516, GNorm = 3.0176, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909560\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1885e-01, PNorm = 52.9701, GNorm = 2.1966, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.922273\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1940e-01, PNorm = 52.9897, GNorm = 4.5356, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.912235\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4716e-01, PNorm = 53.0072, GNorm = 5.4059, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.930405\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6235e-01, PNorm = 53.0240, GNorm = 9.1486, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.969732\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9220e-01, PNorm = 53.0402, GNorm = 2.1359, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909871\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2599e-01, PNorm = 53.0556, GNorm = 3.3054, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894031\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0667e-01, PNorm = 53.0699, GNorm = 1.8463, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905514\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8320e-01, PNorm = 53.0841, GNorm = 6.3816, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941952\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8953e-01, PNorm = 53.0972, GNorm = 3.1321, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903169\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8646e-01, PNorm = 53.1105, GNorm = 2.3400, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926961\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6348e-01, PNorm = 53.1234, GNorm = 2.9398, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910627\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4566e-01, PNorm = 53.1354, GNorm = 2.2907, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.925520\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3648e-01, PNorm = 53.1470, GNorm = 3.9536, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.932798\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8639e-01, PNorm = 53.1575, GNorm = 2.9316, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919326\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3528e-01, PNorm = 53.1669, GNorm = 3.3350, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910786\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5760e-01, PNorm = 53.1753, GNorm = 3.0732, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908702\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2591e-01, PNorm = 53.1839, GNorm = 2.4860, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.929383\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3028e-01, PNorm = 53.1914, GNorm = 2.4948, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936717\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3356e-01, PNorm = 53.1982, GNorm = 5.2257, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885281\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4526e-01, PNorm = 53.2052, GNorm = 3.6641, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897000\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6207e-01, PNorm = 53.2120, GNorm = 3.6492, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911769\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0501e-01, PNorm = 53.2185, GNorm = 2.8125, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.939664\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0653e-01, PNorm = 53.2244, GNorm = 4.4431, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891937\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2169e-01, PNorm = 53.2299, GNorm = 2.5869, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.967135\n",
      "100%|██████████| 50/50 [00:47<00:00,  1.04it/s]\n",
      "Model 0 best validation mae = 0.885281 on epoch 44\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.885281\n",
      "Ensemble test mae = 0.885281\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.885281\n",
      "Overall test mae = 0.885281 +/- 0.000000\n",
      "Elapsed time = 0:01:37\n",
      "15it [29:02, 112.54s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 2400,\n",
      " 'ffn_num_layers': 2,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 2400,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 15\n",
      "{'--hidden_size': '2400', '--ffn_num_layers': '2', '--ffn_hidden_size': '2400', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 247743.89it/s]\n",
      "100%|██████████| 500/500 [00:17<00:00, 29.19it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 142896.70it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 177762.67it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 32.99it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 175515.74it/s]\n",
      "437it [00:00, 289513.64it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 32.82it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 206944.89it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=2400, bias=False)\n",
      "        (W_h): Linear(in_features=2400, out_features=2400, bias=False)\n",
      "        (W_o): Linear(in_features=2533, out_features=2400, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=2600, out_features=2400, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.3, inplace=False)\n",
      "    (4): Linear(in_features=2400, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 18,441,601\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.0438e+00, PNorm = 87.4930, GNorm = 9.9838, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913156\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8656e-01, PNorm = 87.7593, GNorm = 4.2654, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902449\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2618e-01, PNorm = 87.9833, GNorm = 9.2606, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.983436\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0268e-01, PNorm = 88.0954, GNorm = 5.4602, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905184\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3397e-01, PNorm = 88.1503, GNorm = 4.4883, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936638\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7070e-01, PNorm = 88.1795, GNorm = 3.0376, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945977\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3077e-01, PNorm = 88.2002, GNorm = 1.8238, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.922732\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8356e-01, PNorm = 88.2169, GNorm = 5.2451, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.870728\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4514e-01, PNorm = 88.2333, GNorm = 1.8289, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.872580\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8321e-01, PNorm = 88.2490, GNorm = 2.1419, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882501\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4020e-01, PNorm = 88.2698, GNorm = 1.8960, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880521\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3702e-01, PNorm = 88.2938, GNorm = 2.0059, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908603\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3232e-01, PNorm = 88.3208, GNorm = 4.4699, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904556\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1884e-01, PNorm = 88.3446, GNorm = 3.4548, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887089\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8878e-01, PNorm = 88.3720, GNorm = 2.4318, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893910\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.8918e-01, PNorm = 88.3982, GNorm = 1.9519, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906873\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9795e-01, PNorm = 88.4203, GNorm = 4.4470, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902074\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3650e-01, PNorm = 88.4442, GNorm = 2.1664, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876877\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6636e-01, PNorm = 88.4678, GNorm = 5.0662, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903744\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2763e-01, PNorm = 88.4901, GNorm = 3.2301, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890709\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.5584e-01, PNorm = 88.5116, GNorm = 2.7239, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881757\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4976e-01, PNorm = 88.5347, GNorm = 3.6059, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885343\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0592e-01, PNorm = 88.5590, GNorm = 2.8581, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884122\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9308e-01, PNorm = 88.5833, GNorm = 1.8697, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905975\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1246e-01, PNorm = 88.6097, GNorm = 4.7262, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901710\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5236e-01, PNorm = 88.6382, GNorm = 1.7701, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891101\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8497e-01, PNorm = 88.6659, GNorm = 2.0676, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.923770\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3021e-01, PNorm = 88.6954, GNorm = 4.2824, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914227\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7429e-01, PNorm = 88.7246, GNorm = 6.7893, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.941333\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7005e-01, PNorm = 88.7495, GNorm = 7.0945, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.935317\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2992e-01, PNorm = 88.7761, GNorm = 2.0263, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915112\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9110e-01, PNorm = 88.8019, GNorm = 2.8597, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892326\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1740e-01, PNorm = 88.8261, GNorm = 1.8667, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896913\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.9669e-01, PNorm = 88.8506, GNorm = 3.5749, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924503\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6184e-01, PNorm = 88.8739, GNorm = 2.6062, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883264\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6373e-01, PNorm = 88.8947, GNorm = 3.2436, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896999\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6229e-01, PNorm = 88.9152, GNorm = 3.1865, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877658\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4427e-01, PNorm = 88.9361, GNorm = 1.8996, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883270\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4178e-01, PNorm = 88.9572, GNorm = 2.4851, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883666\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6083e-01, PNorm = 88.9778, GNorm = 1.9583, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880633\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0836e-01, PNorm = 88.9977, GNorm = 2.7981, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877679\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6279e-01, PNorm = 89.0143, GNorm = 2.8997, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877746\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9694e-01, PNorm = 89.0331, GNorm = 3.3247, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878533\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9624e-01, PNorm = 89.0502, GNorm = 2.2106, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876152\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4186e-01, PNorm = 89.0662, GNorm = 3.5096, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.863508\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.1832e-01, PNorm = 89.0821, GNorm = 2.4154, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.869406\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9937e-01, PNorm = 89.0959, GNorm = 2.3945, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.874093\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6195e-01, PNorm = 89.1098, GNorm = 2.9110, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919117\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6918e-01, PNorm = 89.1235, GNorm = 2.6936, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892867\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.5858e-01, PNorm = 89.1354, GNorm = 2.1629, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900251\n",
      "100%|██████████| 50/50 [01:26<00:00,  1.74s/it]\n",
      "Model 0 best validation mae = 0.863508 on epoch 44\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.863508\n",
      "Ensemble test mae = 0.863508\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.863508\n",
      "Overall test mae = 0.863508 +/- 0.000000\n",
      "Elapsed time = 0:02:12\n",
      "16it [31:14, 118.39s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 1200,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 16\n",
      "{'--hidden_size': '1200', '--ffn_num_layers': '1', '--ffn_hidden_size': '1200', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "500it [00:00, 156620.76it/s]\n",
      "100%|██████████| 500/500 [00:16<00:00, 30.31it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 194198.72it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 167480.89it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 32.75it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 213079.61it/s]\n",
      "437it [00:00, 265562.28it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.74it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 212980.58it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=1200, bias=False)\n",
      "        (W_h): Linear(in_features=1200, out_features=1200, bias=False)\n",
      "        (W_o): Linear(in_features=1333, out_features=1200, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=1400, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 3,219,801\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.3768e+00, PNorm = 52.2672, GNorm = 8.2852, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915765\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0632e+00, PNorm = 52.3239, GNorm = 3.3760, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.939292\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9525e-01, PNorm = 52.3819, GNorm = 8.6257, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.969857\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7972e-01, PNorm = 52.4235, GNorm = 4.3989, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926613\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4790e-01, PNorm = 52.4551, GNorm = 6.0058, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.954893\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.6127e-01, PNorm = 52.4847, GNorm = 2.1876, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913320\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8389e-01, PNorm = 52.5126, GNorm = 2.2876, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.942428\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9727e-01, PNorm = 52.5375, GNorm = 5.9096, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887571\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6232e-01, PNorm = 52.5682, GNorm = 2.3461, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890039\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3274e-01, PNorm = 52.5947, GNorm = 3.7377, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890737\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1954e-01, PNorm = 52.6252, GNorm = 2.2380, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893177\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9485e-01, PNorm = 52.6571, GNorm = 2.4527, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908385\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5519e-01, PNorm = 52.6929, GNorm = 4.2245, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889991\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6642e-01, PNorm = 52.7279, GNorm = 2.6494, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890918\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3111e-01, PNorm = 52.7642, GNorm = 3.3730, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886805\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2366e-01, PNorm = 52.8048, GNorm = 1.7358, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.944445\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1438e-01, PNorm = 52.8445, GNorm = 3.7285, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902214\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6686e-01, PNorm = 52.8868, GNorm = 3.3557, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871596\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.0282e-01, PNorm = 52.9194, GNorm = 1.8462, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.963709\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9170e-01, PNorm = 52.9566, GNorm = 1.7494, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905536\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3196e-01, PNorm = 52.9917, GNorm = 3.1961, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.948138\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2874e-01, PNorm = 53.0239, GNorm = 2.8225, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.951428\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.4193e-01, PNorm = 53.0573, GNorm = 2.7497, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893869\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.8983e-01, PNorm = 53.0883, GNorm = 2.3721, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889973\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7882e-01, PNorm = 53.1159, GNorm = 3.8262, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890211\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7798e-01, PNorm = 53.1440, GNorm = 2.0696, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.925646\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6776e-01, PNorm = 53.1707, GNorm = 2.2462, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.956133\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5737e-01, PNorm = 53.1973, GNorm = 2.7151, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.940397\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7498e-01, PNorm = 53.2240, GNorm = 7.9803, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.931079\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4386e-01, PNorm = 53.2473, GNorm = 6.0914, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904372\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4337e-01, PNorm = 53.2710, GNorm = 4.9425, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894980\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0742e-01, PNorm = 53.2922, GNorm = 5.5968, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877777\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5884e-01, PNorm = 53.3134, GNorm = 6.3540, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876752\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0997e-01, PNorm = 53.3331, GNorm = 4.3677, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898966\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1247e-01, PNorm = 53.3533, GNorm = 3.0109, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880822\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.0072e-01, PNorm = 53.3689, GNorm = 4.8422, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881946\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8210e-01, PNorm = 53.3859, GNorm = 2.3336, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893273\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7487e-01, PNorm = 53.4009, GNorm = 4.0829, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883609\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4384e-01, PNorm = 53.4165, GNorm = 1.8959, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898002\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3839e-01, PNorm = 53.4303, GNorm = 2.1911, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908878\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0736e-01, PNorm = 53.4430, GNorm = 2.8173, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885352\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.2918e-01, PNorm = 53.4548, GNorm = 4.8448, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894973\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.5721e-01, PNorm = 53.4659, GNorm = 3.1444, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907327\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.4940e-01, PNorm = 53.4774, GNorm = 1.8104, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.906590\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0561e-01, PNorm = 53.4885, GNorm = 5.8566, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879786\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.0497e-01, PNorm = 53.4981, GNorm = 2.7313, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.879842\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.3029e-01, PNorm = 53.5072, GNorm = 8.8672, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883305\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.9706e-01, PNorm = 53.5159, GNorm = 2.3864, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909339\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.8567e-01, PNorm = 53.5239, GNorm = 3.4687, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888192\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 3.6445e-01, PNorm = 53.5325, GNorm = 3.1421, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893366\n",
      "100%|██████████| 50/50 [00:46<00:00,  1.08it/s]\n",
      "Model 0 best validation mae = 0.871596 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.871596\n",
      "Ensemble test mae = 0.871596\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.871596\n",
      "Overall test mae = 0.871596 +/- 0.000000\n",
      "Elapsed time = 0:01:30\n",
      "17it [32:44, 109.79s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 4,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.5,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 17\n",
      "{'--hidden_size': '3600', '--ffn_num_layers': '1', '--ffn_hidden_size': '1200', '--dropout': '0.5', '--depth': '4'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 263660.05it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 32.91it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 207187.51it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 343885.71it/s]\n",
      "100%|██████████| 437/437 [00:12<00:00, 34.62it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 121755.74it/s]\n",
      "437it [00:00, 347142.21it/s]\n",
      "100%|██████████| 437/437 [00:15<00:00, 28.45it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 203837.95it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.5, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.5, inplace=False)\n",
      "    (1): Linear(in_features=3800, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 26,939,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 2.2211e+00, PNorm = 87.0075, GNorm = 3.4567, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919467\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0662e+00, PNorm = 87.3269, GNorm = 2.4166, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.921964\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0622e+00, PNorm = 87.5794, GNorm = 3.2364, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913665\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0035e+00, PNorm = 87.7022, GNorm = 2.3952, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898067\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.8757e-01, PNorm = 87.7627, GNorm = 3.4057, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915378\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9877e-01, PNorm = 87.8005, GNorm = 3.0679, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.931143\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7364e-01, PNorm = 87.8353, GNorm = 2.7663, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896290\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4662e-01, PNorm = 87.8657, GNorm = 3.4566, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889914\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2076e-01, PNorm = 87.9034, GNorm = 2.9263, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911610\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5239e-01, PNorm = 87.9338, GNorm = 2.9141, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904705\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4369e-01, PNorm = 87.9685, GNorm = 2.5541, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891284\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1162e-01, PNorm = 88.0003, GNorm = 2.8922, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895824\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0244e-01, PNorm = 88.0372, GNorm = 4.8433, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897615\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0991e-01, PNorm = 88.0682, GNorm = 2.1616, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890333\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1770e-01, PNorm = 88.1016, GNorm = 3.0534, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907106\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0189e-01, PNorm = 88.1375, GNorm = 2.0214, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.881674\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8757e-01, PNorm = 88.1740, GNorm = 6.3796, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886476\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6553e-01, PNorm = 88.2131, GNorm = 2.3883, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.868655\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8262e-01, PNorm = 88.2511, GNorm = 6.2649, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888740\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7279e-01, PNorm = 88.2866, GNorm = 2.6400, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894434\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3620e-01, PNorm = 88.3214, GNorm = 2.7350, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888615\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3085e-01, PNorm = 88.3573, GNorm = 2.1924, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911660\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1666e-01, PNorm = 88.3967, GNorm = 2.7757, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895675\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.9513e-01, PNorm = 88.4396, GNorm = 2.2754, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897701\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7256e-01, PNorm = 88.4831, GNorm = 6.1013, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876275\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.1047e-01, PNorm = 88.5240, GNorm = 2.5385, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878683\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6253e-01, PNorm = 88.5637, GNorm = 2.6350, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898804\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6893e-01, PNorm = 88.6005, GNorm = 7.6942, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896381\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.7795e-01, PNorm = 88.6349, GNorm = 4.7062, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919679\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.6861e-01, PNorm = 88.6706, GNorm = 10.3003, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.950339\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.3531e-01, PNorm = 88.7046, GNorm = 3.8142, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920061\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2478e-01, PNorm = 88.7365, GNorm = 2.6658, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902788\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.2368e-01, PNorm = 88.7672, GNorm = 2.4960, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915503\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.0748e-01, PNorm = 88.7960, GNorm = 7.7853, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.931770\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 6.1025e-01, PNorm = 88.8236, GNorm = 2.5374, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883918\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.9099e-01, PNorm = 88.8490, GNorm = 2.7471, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905670\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6779e-01, PNorm = 88.8750, GNorm = 2.6989, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902208\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.7395e-01, PNorm = 88.8986, GNorm = 2.4538, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905411\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.5351e-01, PNorm = 88.9221, GNorm = 3.2126, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.918342\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.6625e-01, PNorm = 88.9433, GNorm = 3.3880, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916398\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2960e-01, PNorm = 88.9642, GNorm = 2.6276, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911896\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1992e-01, PNorm = 88.9848, GNorm = 2.4918, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911880\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.1547e-01, PNorm = 89.0053, GNorm = 3.8040, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936247\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3364e-01, PNorm = 89.0232, GNorm = 1.9747, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.942006\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.2843e-01, PNorm = 89.0386, GNorm = 5.3338, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886459\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.4054e-01, PNorm = 89.0543, GNorm = 2.1527, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883252\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 5.3120e-01, PNorm = 89.0702, GNorm = 3.3967, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904712\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.6730e-01, PNorm = 89.0843, GNorm = 2.7835, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.944664\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.7978e-01, PNorm = 89.0968, GNorm = 2.8887, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897630\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 4.8439e-01, PNorm = 89.1093, GNorm = 3.4725, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.915380\n",
      "100%|██████████| 50/50 [01:51<00:00,  2.23s/it]\n",
      "Model 0 best validation mae = 0.868655 on epoch 17\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.868655\n",
      "Ensemble test mae = 0.868655\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.868655\n",
      "Overall test mae = 0.868655 +/- 0.000000\n",
      "Elapsed time = 0:02:36\n",
      "18it [35:20, 123.74s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.5,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 1200,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 18\n",
      "{'--hidden_size': '600', '--ffn_num_layers': '3', '--ffn_hidden_size': '1200', '--dropout': '0.5', '--depth': '5'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 253279.23it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 32.86it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 204920.07it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 331029.59it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.10it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 192108.88it/s]\n",
      "437it [00:00, 246590.99it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.56it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 208854.93it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.5, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=600, bias=False)\n",
      "        (W_h): Linear(in_features=600, out_features=600, bias=False)\n",
      "        (W_o): Linear(in_features=733, out_features=600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.5, inplace=False)\n",
      "    (1): Linear(in_features=800, out_features=1200, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.5, inplace=False)\n",
      "    (4): Linear(in_features=1200, out_features=1200, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.5, inplace=False)\n",
      "    (7): Linear(in_features=1200, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 3,292,801\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4973e+00, PNorm = 60.5586, GNorm = 12.8357, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899261\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1825e+00, PNorm = 60.6559, GNorm = 7.4621, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.973007\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1592e+00, PNorm = 60.7733, GNorm = 9.8880, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.953877\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0888e+00, PNorm = 60.8583, GNorm = 7.4985, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.916992\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0228e+00, PNorm = 60.9168, GNorm = 4.4320, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.936565\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0019e+00, PNorm = 60.9582, GNorm = 3.7365, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917258\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5487e-01, PNorm = 60.9906, GNorm = 4.5588, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884130\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.5274e-01, PNorm = 61.0177, GNorm = 4.9906, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.871882\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3036e-01, PNorm = 61.0415, GNorm = 3.7138, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911650\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4782e-01, PNorm = 61.0626, GNorm = 5.1106, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.878286\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.0254e-01, PNorm = 61.0809, GNorm = 3.6418, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.895491\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5626e-01, PNorm = 61.0986, GNorm = 2.8946, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891175\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7301e-01, PNorm = 61.1153, GNorm = 3.6789, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.883944\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.9705e-01, PNorm = 61.1296, GNorm = 4.1801, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897009\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7303e-01, PNorm = 61.1432, GNorm = 3.0769, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896695\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8315e-01, PNorm = 61.1568, GNorm = 2.6324, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886524\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2004e-01, PNorm = 61.1694, GNorm = 3.5516, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.876201\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6952e-01, PNorm = 61.1810, GNorm = 5.0989, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890826\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4175e-01, PNorm = 61.1917, GNorm = 4.2389, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877655\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6772e-01, PNorm = 61.2018, GNorm = 3.6328, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.892646\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5971e-01, PNorm = 61.2110, GNorm = 3.3589, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.887164\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2400e-01, PNorm = 61.2200, GNorm = 3.0617, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891566\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4519e-01, PNorm = 61.2292, GNorm = 3.2678, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888625\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3672e-01, PNorm = 61.2376, GNorm = 2.7680, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894962\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9659e-01, PNorm = 61.2462, GNorm = 3.9886, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877835\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5160e-01, PNorm = 61.2525, GNorm = 3.5931, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898422\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4426e-01, PNorm = 61.2591, GNorm = 3.1065, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891447\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2796e-01, PNorm = 61.2658, GNorm = 4.2863, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886798\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5599e-01, PNorm = 61.2722, GNorm = 4.3964, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.901462\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1321e-01, PNorm = 61.2785, GNorm = 3.3053, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890247\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6469e-01, PNorm = 61.2840, GNorm = 2.8816, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888955\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7156e-01, PNorm = 61.2899, GNorm = 3.4636, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890083\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7518e-01, PNorm = 61.2960, GNorm = 2.3955, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888200\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3918e-01, PNorm = 61.3014, GNorm = 4.8065, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913127\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9845e-01, PNorm = 61.3062, GNorm = 3.3840, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.880311\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7744e-01, PNorm = 61.3107, GNorm = 3.0333, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905344\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6506e-01, PNorm = 61.3148, GNorm = 3.5057, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888502\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0960e-01, PNorm = 61.3184, GNorm = 3.2665, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.908366\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4560e-01, PNorm = 61.3220, GNorm = 3.1797, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896023\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6969e-01, PNorm = 61.3256, GNorm = 3.0383, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900119\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5182e-01, PNorm = 61.3292, GNorm = 3.2758, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885615\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7584e-01, PNorm = 61.3318, GNorm = 3.1387, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896753\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5389e-01, PNorm = 61.3342, GNorm = 2.8168, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.889787\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.4924e-01, PNorm = 61.3366, GNorm = 2.5478, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893187\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.2037e-01, PNorm = 61.3398, GNorm = 2.9410, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893462\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3665e-01, PNorm = 61.3426, GNorm = 4.1221, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896069\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8037e-01, PNorm = 61.3445, GNorm = 2.7715, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886760\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5373e-01, PNorm = 61.3463, GNorm = 3.1007, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891304\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.3775e-01, PNorm = 61.3485, GNorm = 4.4347, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.899471\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.5724e-01, PNorm = 61.3508, GNorm = 3.3102, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.891945\n",
      "100%|██████████| 50/50 [00:38<00:00,  1.30it/s]\n",
      "Model 0 best validation mae = 0.871882 on epoch 7\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Loading pretrained parameter \"readout.4.weight\".\n",
      "Loading pretrained parameter \"readout.4.bias\".\n",
      "Loading pretrained parameter \"readout.7.weight\".\n",
      "Loading pretrained parameter \"readout.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.871882\n",
      "Ensemble test mae = 0.871882\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.871882\n",
      "Overall test mae = 0.871882 +/- 0.000000\n",
      "Elapsed time = 0:01:21\n",
      "19it [36:41, 110.83s/it]Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.5,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HYPERPARAMETER 19\n",
      "{'--hidden_size': '600', '--ffn_num_layers': '1', '--ffn_hidden_size': '600', '--dropout': '0.5', '--depth': '6'}\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "500it [00:00, 278802.45it/s]\n",
      "100%|██████████| 500/500 [00:15<00:00, 33.02it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 131846.60it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 179538.73it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.33it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 126051.22it/s]\n",
      "437it [00:00, 333014.33it/s]\n",
      "100%|██████████| 437/437 [00:13<00:00, 33.05it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 205023.58it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.5, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=600, bias=False)\n",
      "        (W_h): Linear(in_features=600, out_features=600, bias=False)\n",
      "        (W_o): Linear(in_features=733, out_features=600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.5, inplace=False)\n",
      "    (1): Linear(in_features=800, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 890,001\n",
      "Moving model to cuda\n",
      "Epoch 0\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.4639e+00, PNorm = 38.6543, GNorm = 5.1769, lr_0 = 5.9500e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897666\n",
      "Epoch 1\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1355e+00, PNorm = 38.6793, GNorm = 4.9261, lr_0 = 9.9521e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920968\n",
      "Epoch 2\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1236e+00, PNorm = 38.7083, GNorm = 3.4259, lr_0 = 9.4860e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.938060\n",
      "Epoch 3\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.1896e+00, PNorm = 38.7300, GNorm = 3.1976, lr_0 = 9.0417e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.884110\n",
      "Epoch 4\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0414e+00, PNorm = 38.7438, GNorm = 3.7018, lr_0 = 8.6182e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.911345\n",
      "Epoch 5\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0690e+00, PNorm = 38.7547, GNorm = 2.6214, lr_0 = 8.2145e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920675\n",
      "Epoch 6\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0762e+00, PNorm = 38.7642, GNorm = 4.6695, lr_0 = 7.8298e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900389\n",
      "Epoch 7\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0849e+00, PNorm = 38.7725, GNorm = 3.9615, lr_0 = 7.4631e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.877923\n",
      "Epoch 8\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 1.0102e+00, PNorm = 38.7802, GNorm = 2.8533, lr_0 = 7.1135e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896216\n",
      "Epoch 9\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7327e-01, PNorm = 38.7886, GNorm = 5.3420, lr_0 = 6.7803e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.875437\n",
      "Epoch 10\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.7700e-01, PNorm = 38.7949, GNorm = 4.0104, lr_0 = 6.4627e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903475\n",
      "Epoch 11\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.4997e-01, PNorm = 38.8020, GNorm = 3.7392, lr_0 = 6.1600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905626\n",
      "Epoch 12\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2957e-01, PNorm = 38.8099, GNorm = 2.7017, lr_0 = 5.8715e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.886782\n",
      "Epoch 13\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.3214e-01, PNorm = 38.8164, GNorm = 3.2805, lr_0 = 5.5965e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.907555\n",
      "Epoch 14\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9323e-01, PNorm = 38.8228, GNorm = 4.0677, lr_0 = 5.3344e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.897976\n",
      "Epoch 15\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7961e-01, PNorm = 38.8300, GNorm = 2.6628, lr_0 = 5.0845e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.888662\n",
      "Epoch 16\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6091e-01, PNorm = 38.8365, GNorm = 2.4327, lr_0 = 4.8464e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896701\n",
      "Epoch 17\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 9.2058e-01, PNorm = 38.8437, GNorm = 4.4623, lr_0 = 4.6194e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.882298\n",
      "Epoch 18\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.9140e-01, PNorm = 38.8498, GNorm = 4.5713, lr_0 = 4.4030e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.890728\n",
      "Epoch 19\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4091e-01, PNorm = 38.8564, GNorm = 2.6486, lr_0 = 4.1968e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.894206\n",
      "Epoch 20\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.8011e-01, PNorm = 38.8628, GNorm = 3.6284, lr_0 = 4.0002e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.898499\n",
      "Epoch 21\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.7373e-01, PNorm = 38.8683, GNorm = 2.4491, lr_0 = 3.8129e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927282\n",
      "Epoch 22\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6355e-01, PNorm = 38.8743, GNorm = 2.8185, lr_0 = 3.6343e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.893705\n",
      "Epoch 23\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4144e-01, PNorm = 38.8790, GNorm = 2.2230, lr_0 = 3.4640e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.909591\n",
      "Epoch 24\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5826e-01, PNorm = 38.8837, GNorm = 3.9513, lr_0 = 3.3018e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917319\n",
      "Epoch 25\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1225e-01, PNorm = 38.8882, GNorm = 2.5213, lr_0 = 3.1471e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914651\n",
      "Epoch 26\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1413e-01, PNorm = 38.8932, GNorm = 2.2735, lr_0 = 2.9997e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910144\n",
      "Epoch 27\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.6185e-01, PNorm = 38.8974, GNorm = 8.9849, lr_0 = 2.8592e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.900909\n",
      "Epoch 28\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3271e-01, PNorm = 38.9005, GNorm = 5.1345, lr_0 = 2.7253e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.922953\n",
      "Epoch 29\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.4758e-01, PNorm = 38.9045, GNorm = 4.2926, lr_0 = 2.5977e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.933721\n",
      "Epoch 30\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.2793e-01, PNorm = 38.9085, GNorm = 3.4943, lr_0 = 2.4760e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.885778\n",
      "Epoch 31\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5328e-01, PNorm = 38.9117, GNorm = 4.5387, lr_0 = 2.3600e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.927002\n",
      "Epoch 32\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1926e-01, PNorm = 38.9152, GNorm = 2.4767, lr_0 = 2.2495e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.904929\n",
      "Epoch 33\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0012e-01, PNorm = 38.9187, GNorm = 4.2598, lr_0 = 2.1441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926702\n",
      "Epoch 34\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.3174e-01, PNorm = 38.9219, GNorm = 2.9145, lr_0 = 2.0437e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.905120\n",
      "Epoch 35\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0418e-01, PNorm = 38.9247, GNorm = 2.9174, lr_0 = 1.9480e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.926889\n",
      "Epoch 36\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8194e-01, PNorm = 38.9271, GNorm = 3.1467, lr_0 = 1.8567e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.903847\n",
      "Epoch 37\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.0714e-01, PNorm = 38.9296, GNorm = 2.5762, lr_0 = 1.7698e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.928118\n",
      "Epoch 38\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.5088e-01, PNorm = 38.9328, GNorm = 2.7125, lr_0 = 1.6869e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919694\n",
      "Epoch 39\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9774e-01, PNorm = 38.9354, GNorm = 2.9149, lr_0 = 1.6079e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.925285\n",
      "Epoch 40\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 8.1221e-01, PNorm = 38.9382, GNorm = 2.9992, lr_0 = 1.5326e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.902769\n",
      "Epoch 41\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7893e-01, PNorm = 38.9403, GNorm = 2.7747, lr_0 = 1.4608e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.920588\n",
      "Epoch 42\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7339e-01, PNorm = 38.9424, GNorm = 2.8344, lr_0 = 1.3924e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.914378\n",
      "Epoch 43\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8770e-01, PNorm = 38.9449, GNorm = 2.5085, lr_0 = 1.3271e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.910433\n",
      "Epoch 44\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8755e-01, PNorm = 38.9474, GNorm = 3.8098, lr_0 = 1.2650e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.924404\n",
      "Epoch 45\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.6468e-01, PNorm = 38.9497, GNorm = 3.2669, lr_0 = 1.2057e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.919038\n",
      "Epoch 46\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8241e-01, PNorm = 38.9517, GNorm = 3.3440, lr_0 = 1.1493e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.896808\n",
      "Epoch 47\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.8397e-01, PNorm = 38.9533, GNorm = 4.0562, lr_0 = 1.0954e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.945822\n",
      "Epoch 48\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.9318e-01, PNorm = 38.9552, GNorm = 6.0520, lr_0 = 1.0441e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.913041\n",
      "Epoch 49\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[ALoss = 7.7325e-01, PNorm = 38.9571, GNorm = 4.0595, lr_0 = 1.0000e-04\n",
      "\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[A\n",
      "\u001b[AValidation mae = 0.917844\n",
      "100%|██████████| 50/50 [00:40<00:00,  1.25it/s]\n",
      "Model 0 best validation mae = 0.875437 on epoch 9\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.875437\n",
      "Ensemble test mae = 0.875437\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.875437\n",
      "Overall test mae = 0.875437 +/- 0.000000\n",
      "Elapsed time = 0:01:22\n",
      "20it [38:03, 114.18s/it]\n"
     ]
    }
   ],
   "source": [
    "from copy import copy\n",
    "from tqdm import tqdm\n",
    "from sklearn.model_selection import ParameterSampler\n",
    "\n",
    "hyperparam_list = list(ParameterSampler(param_dict, n_iter=20))\n",
    "\n",
    "best_score = 0.0\n",
    "best_hyperparams = None\n",
    "\n",
    "for i, hyperparam in tqdm(enumerate(hyperparam_list)):\n",
    "    print('HYPERPARAMETER', i)\n",
    "    print(hyperparam)\n",
    "    result_arguments = copy(base_arguments)\n",
    "    for key, value in hyperparam.items():\n",
    "        result_arguments.append(key)\n",
    "        result_arguments.append(value)\n",
    "    # Train\n",
    "    args = chemprop.args.TrainArgs().parse_args(result_arguments)\n",
    "    mean_score, std_score = chemprop.train.cross_validate(args=args, train_func=chemprop.train.run_training)\n",
    "\n",
    "    test_preds = pd.read_csv(temp_datapath + 'checkpoint/test_preds.csv')\n",
    "    metrics = get_lo_metrics(test, test_preds['targets'].to_list())\n",
    "\n",
    "    score = metrics['spearman']\n",
    "    if score > best_score:\n",
    "        print('New best spearman:', score)\n",
    "        best_score = score\n",
    "        best_hyperparams = hyperparam"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'--hidden_size': '3600', '--ffn_num_layers': '1', '--ffn_hidden_size': '600', '--dropout': '0.3', '--depth': '6'}\n"
     ]
    }
   ],
   "source": [
    "print(best_hyperparams)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.19161837152622288\n"
     ]
    }
   ],
   "source": [
    "print(best_score)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Command line\n",
      "python /home/simon/miniconda3/envs/chemprop/lib/python3.8/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"77dd52d3-097b-4972-86c5-fa173d3caa02\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/simon/.local/share/jupyter/runtime/kernel-v2-18626mugnYUVx5iHO.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_bond_types': True,\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_constraints': [],\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'atom_targets': [],\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_constraints': [],\n",
      " 'bond_descriptor_scaling': True,\n",
      " 'bond_descriptors': None,\n",
      " 'bond_descriptors_path': None,\n",
      " 'bond_descriptors_size': 0,\n",
      " 'bond_features_size': 0,\n",
      " 'bond_targets': [],\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'constraints_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'regression',\n",
      " 'depth': 6,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=0),\n",
      " 'dropout': 0.3,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 50,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': ['rdkit_2d_normalized'],\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': False,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 1,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 0,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'is_atom_bond_targets': False,\n",
      " 'keeping_atom_map': False,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'mse',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'mae',\n",
      " 'metrics': ['mae'],\n",
      " 'minimize_score': True,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_adding_bond_types': False,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_descriptor_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': True,\n",
      " 'no_shared_atom_bond_ffn': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_descriptors_path': None,\n",
      " 'separate_test_constraints_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_descriptors_path': None,\n",
      " 'separate_val_constraints_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'shared_atom_bond_ffn': True,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': True,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0,\n",
      " 'weights_ffn_num_layers': 2}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "500it [00:00, 348537.81it/s]\n",
      "100%|██████████| 500/500 [00:12<00:00, 41.02it/s]\n",
      "100%|██████████| 500/500 [00:00<00:00, 246520.75it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "437it [00:00, 388493.19it/s]\n",
      "100%|██████████| 437/437 [00:10<00:00, 43.15it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 245929.27it/s]\n",
      "437it [00:00, 404080.87it/s]\n",
      "100%|██████████| 437/437 [00:11<00:00, 38.40it/s]\n",
      "100%|██████████| 437/437 [00:00<00:00, 216681.74it/s]\n",
      "Total size = 500 | train size = 500 | val size = 437 | test size = 437\n",
      "Fitting scaler\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout): Dropout(p=0.3, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (readout): Sequential(\n",
      "    (0): Dropout(p=0.3, inplace=False)\n",
      "    (1): Linear(in_features=3800, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 26,939,001\n",
      "Moving model to cuda\n",
      "  0%|          | 0/50 [00:00<?, ?it/s]Epoch 0\n",
      "Loss = 2.3958e+00, PNorm = 87.0283, GNorm = 5.0413, lr_0 = 5.9500e-04\n",
      "Validation mae = 0.910734\n",
      "  2%|▏         | 1/50 [00:03<02:44,  3.35s/it]Epoch 1\n",
      "Loss = 1.0953e+00, PNorm = 87.3805, GNorm = 1.7195, lr_0 = 9.9521e-04\n",
      "Validation mae = 0.924802\n",
      "  4%|▍         | 2/50 [00:06<02:35,  3.24s/it]Epoch 2\n",
      "Loss = 1.0251e+00, PNorm = 87.6550, GNorm = 2.3342, lr_0 = 9.4860e-04\n",
      "Validation mae = 0.915488\n",
      "  6%|▌         | 3/50 [00:09<02:30,  3.21s/it]Epoch 3\n",
      "Loss = 9.9544e-01, PNorm = 87.7838, GNorm = 1.7993, lr_0 = 9.0417e-04\n",
      "Validation mae = 0.897034\n",
      "  8%|▊         | 4/50 [00:13<02:29,  3.25s/it]Epoch 4\n",
      "Loss = 9.7368e-01, PNorm = 87.8428, GNorm = 2.5804, lr_0 = 8.6182e-04\n",
      "Validation mae = 0.908919\n",
      " 10%|█         | 5/50 [00:16<02:24,  3.20s/it]Epoch 5\n",
      "Loss = 9.2662e-01, PNorm = 87.8768, GNorm = 1.8910, lr_0 = 8.2145e-04\n",
      "Validation mae = 0.907568\n",
      " 12%|█▏        | 6/50 [00:19<02:19,  3.18s/it]Epoch 6\n",
      "Loss = 8.8570e-01, PNorm = 87.9045, GNorm = 3.5002, lr_0 = 7.8298e-04\n",
      "Validation mae = 0.946017\n",
      " 14%|█▍        | 7/50 [00:22<02:16,  3.16s/it]Epoch 7\n",
      "Loss = 8.8713e-01, PNorm = 87.9327, GNorm = 4.1098, lr_0 = 7.4631e-04\n",
      "Validation mae = 0.888096\n",
      " 16%|█▌        | 8/50 [00:25<02:15,  3.22s/it]Epoch 8\n",
      "Loss = 8.2428e-01, PNorm = 87.9642, GNorm = 2.1240, lr_0 = 7.1135e-04\n",
      "Validation mae = 0.899320\n",
      " 18%|█▊        | 9/50 [00:28<02:11,  3.22s/it]Epoch 9\n",
      "Loss = 8.2591e-01, PNorm = 87.9878, GNorm = 3.4966, lr_0 = 6.7803e-04\n",
      "Validation mae = 0.894433\n",
      " 20%|██        | 10/50 [00:32<02:08,  3.21s/it]Epoch 10\n",
      "Loss = 8.1647e-01, PNorm = 88.0201, GNorm = 2.1341, lr_0 = 6.4627e-04\n",
      "Validation mae = 0.874971\n",
      " 22%|██▏       | 11/50 [00:35<02:07,  3.27s/it]Epoch 11\n",
      "Loss = 8.0956e-01, PNorm = 88.0475, GNorm = 2.1235, lr_0 = 6.1600e-04\n",
      "Validation mae = 0.903949\n",
      " 24%|██▍       | 12/50 [00:38<02:03,  3.24s/it]Epoch 12\n",
      "Loss = 7.8750e-01, PNorm = 88.0792, GNorm = 3.4486, lr_0 = 5.8715e-04\n",
      "Validation mae = 0.894593\n",
      " 26%|██▌       | 13/50 [00:41<01:59,  3.23s/it]Epoch 13\n",
      "Loss = 7.7581e-01, PNorm = 88.1126, GNorm = 2.8559, lr_0 = 5.5965e-04\n",
      "Validation mae = 0.898567\n",
      " 28%|██▊       | 14/50 [00:45<01:55,  3.22s/it]Epoch 14\n",
      "Loss = 7.6110e-01, PNorm = 88.1455, GNorm = 2.9689, lr_0 = 5.3344e-04\n",
      "Validation mae = 0.885508\n",
      " 30%|███       | 15/50 [00:48<01:52,  3.21s/it]Epoch 15\n",
      "Loss = 7.5854e-01, PNorm = 88.1853, GNorm = 1.8350, lr_0 = 5.0845e-04\n",
      "Validation mae = 0.870181\n",
      " 32%|███▏      | 16/50 [00:51<01:50,  3.26s/it]Epoch 16\n",
      "Loss = 7.3579e-01, PNorm = 88.2266, GNorm = 6.4367, lr_0 = 4.8464e-04\n",
      "Validation mae = 0.874113\n",
      " 34%|███▍      | 17/50 [00:54<01:46,  3.23s/it]Epoch 17\n",
      "Loss = 6.9201e-01, PNorm = 88.2712, GNorm = 2.1436, lr_0 = 4.6194e-04\n",
      "Validation mae = 0.864902\n",
      " 36%|███▌      | 18/50 [00:58<01:44,  3.27s/it]Epoch 18\n",
      "Loss = 7.4050e-01, PNorm = 88.3152, GNorm = 6.8904, lr_0 = 4.4030e-04\n",
      "Validation mae = 0.881273\n",
      " 38%|███▊      | 19/50 [01:01<01:40,  3.24s/it]Epoch 19\n",
      "Loss = 6.6266e-01, PNorm = 88.3600, GNorm = 4.6812, lr_0 = 4.1968e-04\n",
      "Validation mae = 0.865718\n",
      " 40%|████      | 20/50 [01:04<01:36,  3.22s/it]Epoch 20\n",
      "Loss = 7.1357e-01, PNorm = 88.4038, GNorm = 2.7877, lr_0 = 4.0002e-04\n",
      "Validation mae = 0.870166\n",
      " 42%|████▏     | 21/50 [01:07<01:32,  3.21s/it]Epoch 21\n",
      "Loss = 6.3891e-01, PNorm = 88.4462, GNorm = 1.4940, lr_0 = 3.8129e-04\n",
      "Validation mae = 0.902744\n",
      " 44%|████▍     | 22/50 [01:10<01:29,  3.19s/it]Epoch 22\n",
      "Loss = 6.0786e-01, PNorm = 88.4910, GNorm = 2.8062, lr_0 = 3.6343e-04\n",
      "Validation mae = 0.887044\n",
      " 46%|████▌     | 23/50 [01:14<01:26,  3.19s/it]Epoch 23\n",
      "Loss = 6.2149e-01, PNorm = 88.5359, GNorm = 1.3251, lr_0 = 3.4640e-04\n",
      "Validation mae = 0.886737\n",
      " 48%|████▊     | 24/50 [01:17<01:23,  3.22s/it]Epoch 24\n",
      "Loss = 5.7802e-01, PNorm = 88.5831, GNorm = 4.0902, lr_0 = 3.3018e-04\n",
      "Validation mae = 0.879767\n",
      " 50%|█████     | 25/50 [01:20<01:20,  3.20s/it]Epoch 25\n",
      "Loss = 5.6316e-01, PNorm = 88.6271, GNorm = 1.8550, lr_0 = 3.1471e-04\n",
      "Validation mae = 0.908849\n",
      " 52%|█████▏    | 26/50 [01:23<01:16,  3.19s/it]Epoch 26\n",
      "Loss = 5.4363e-01, PNorm = 88.6676, GNorm = 2.0665, lr_0 = 2.9997e-04\n",
      "Validation mae = 0.936274\n",
      " 54%|█████▍    | 27/50 [01:26<01:13,  3.19s/it]Epoch 27\n",
      "Loss = 5.1524e-01, PNorm = 88.7069, GNorm = 3.0901, lr_0 = 2.8592e-04\n",
      "Validation mae = 0.897046\n",
      " 56%|█████▌    | 28/50 [01:30<01:10,  3.18s/it]Epoch 28\n",
      "Loss = 5.1733e-01, PNorm = 88.7486, GNorm = 6.4282, lr_0 = 2.7253e-04\n",
      "Validation mae = 0.891882\n",
      " 58%|█████▊    | 29/50 [01:33<01:06,  3.18s/it]Epoch 29\n",
      "Loss = 4.8937e-01, PNorm = 88.7856, GNorm = 3.7440, lr_0 = 2.5977e-04\n",
      "Validation mae = 0.878039\n",
      " 60%|██████    | 30/50 [01:36<01:03,  3.18s/it]Epoch 30\n",
      "Loss = 4.8435e-01, PNorm = 88.8243, GNorm = 4.6199, lr_0 = 2.4760e-04\n",
      "Validation mae = 0.876126\n",
      " 62%|██████▏   | 31/50 [01:39<01:00,  3.18s/it]Epoch 31\n",
      "Loss = 4.7414e-01, PNorm = 88.8608, GNorm = 4.1629, lr_0 = 2.3600e-04\n",
      "Validation mae = 0.909948\n",
      " 64%|██████▍   | 32/50 [01:42<00:57,  3.18s/it]Epoch 32\n",
      "Loss = 4.3580e-01, PNorm = 88.8973, GNorm = 2.4499, lr_0 = 2.2495e-04\n",
      "Validation mae = 0.927757\n",
      " 66%|██████▌   | 33/50 [01:45<00:54,  3.18s/it]Epoch 33\n",
      "Loss = 4.6112e-01, PNorm = 88.9283, GNorm = 8.7047, lr_0 = 2.1441e-04\n",
      "Validation mae = 0.880485\n",
      " 68%|██████▊   | 34/50 [01:49<00:51,  3.19s/it]Epoch 34\n",
      "Loss = 5.0192e-01, PNorm = 88.9597, GNorm = 5.4334, lr_0 = 2.0437e-04\n",
      "Validation mae = 0.864227\n",
      " 70%|███████   | 35/50 [01:52<00:48,  3.24s/it]Epoch 35\n",
      "Loss = 4.7512e-01, PNorm = 88.9871, GNorm = 5.4879, lr_0 = 1.9480e-04\n",
      "Validation mae = 0.870929\n",
      " 72%|███████▏  | 36/50 [01:55<00:45,  3.23s/it]Epoch 36\n",
      "Loss = 4.2826e-01, PNorm = 89.0163, GNorm = 1.8891, lr_0 = 1.8567e-04\n",
      "Validation mae = 0.871800\n",
      " 74%|███████▍  | 37/50 [01:58<00:41,  3.21s/it]Epoch 37\n",
      "Loss = 4.3573e-01, PNorm = 89.0424, GNorm = 2.1590, lr_0 = 1.7698e-04\n",
      "Validation mae = 0.869452\n",
      " 76%|███████▌  | 38/50 [02:02<00:38,  3.20s/it]Epoch 38\n",
      "Loss = 3.8433e-01, PNorm = 89.0674, GNorm = 3.5853, lr_0 = 1.6869e-04\n",
      "Validation mae = 0.899381\n",
      " 78%|███████▊  | 39/50 [02:05<00:35,  3.20s/it]Epoch 39\n",
      "Loss = 3.9051e-01, PNorm = 89.0907, GNorm = 2.6863, lr_0 = 1.6079e-04\n",
      "Validation mae = 0.905364\n",
      " 80%|████████  | 40/50 [02:08<00:31,  3.20s/it]Epoch 40\n",
      "Loss = 3.5496e-01, PNorm = 89.1125, GNorm = 2.1538, lr_0 = 1.5326e-04\n",
      "Validation mae = 0.882668\n",
      " 82%|████████▏ | 41/50 [02:11<00:28,  3.19s/it]Epoch 41\n",
      "Loss = 3.4762e-01, PNorm = 89.1331, GNorm = 2.4457, lr_0 = 1.4608e-04\n",
      "Validation mae = 0.889389\n",
      " 84%|████████▍ | 42/50 [02:14<00:25,  3.20s/it]Epoch 42\n",
      "Loss = 3.4641e-01, PNorm = 89.1543, GNorm = 2.2578, lr_0 = 1.3924e-04\n",
      "Validation mae = 0.941612\n",
      " 86%|████████▌ | 43/50 [02:18<00:22,  3.20s/it]Epoch 43\n",
      "Loss = 3.5795e-01, PNorm = 89.1743, GNorm = 3.8474, lr_0 = 1.3271e-04\n",
      "Validation mae = 0.924628\n",
      " 88%|████████▊ | 44/50 [02:21<00:19,  3.20s/it]Epoch 44\n",
      "Loss = 3.3326e-01, PNorm = 89.1928, GNorm = 2.3647, lr_0 = 1.2650e-04\n",
      "Validation mae = 0.881559\n",
      " 90%|█████████ | 45/50 [02:24<00:15,  3.19s/it]Epoch 45\n",
      "Loss = 3.1403e-01, PNorm = 89.2106, GNorm = 3.0233, lr_0 = 1.2057e-04\n",
      "Validation mae = 0.864168\n",
      " 92%|█████████▏| 46/50 [02:27<00:13,  3.25s/it]Epoch 46\n",
      "Loss = 3.2657e-01, PNorm = 89.2267, GNorm = 5.7850, lr_0 = 1.1493e-04\n",
      "Validation mae = 0.866967\n",
      " 94%|█████████▍| 47/50 [02:30<00:09,  3.23s/it]Epoch 47\n",
      "Loss = 3.2334e-01, PNorm = 89.2412, GNorm = 2.2487, lr_0 = 1.0954e-04\n",
      "Validation mae = 0.898704\n",
      " 96%|█████████▌| 48/50 [02:34<00:06,  3.22s/it]Epoch 48\n",
      "Loss = 3.0872e-01, PNorm = 89.2557, GNorm = 1.9716, lr_0 = 1.0441e-04\n",
      "Validation mae = 0.870904\n",
      " 98%|█████████▊| 49/50 [02:37<00:03,  3.21s/it]Epoch 49\n",
      "Loss = 2.8135e-01, PNorm = 89.2702, GNorm = 5.6937, lr_0 = 1.0000e-04\n",
      "Validation mae = 0.874385\n",
      "100%|██████████| 50/50 [02:40<00:00,  3.21s/it]\n",
      "Model 0 best validation mae = 0.864168 on epoch 45\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"readout.1.weight\".\n",
      "Loading pretrained parameter \"readout.1.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test mae = 0.864168                  \n",
      "Ensemble test mae = 0.864168\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test mae = 0.864168\n",
      "Overall test mae = 0.864168 +/- 0.000000\n",
      "Elapsed time = 0:03:16\n"
     ]
    }
   ],
   "source": [
    "from copy import copy\n",
    "\n",
    "result_arguments = copy(base_arguments)\n",
    "result_arguments.extend([\n",
    "    '--hidden_size', '3600',\n",
    "    '--ffn_num_layers', '1',\n",
    "    '--ffn_hidden_size', '600',\n",
    "    '--dropout', '0.3',\n",
    "    '--depth', '6'\n",
    "])\n",
    "\n",
    "args = chemprop.args.TrainArgs().parse_args(result_arguments)\n",
    "mean_score, std_score = chemprop.train.cross_validate(args=args, train_func=chemprop.train.run_training)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "epoch = 45"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Command line\n",
      "python /home/steshin/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"6c604d94-190d-4da2-9c36-788708df5377\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/steshin/.local/share/jupyter/runtime/kernel-v2-2822374BRuswu5zWdXq.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_feature_scaling': True,\n",
      " 'bond_features_path': None,\n",
      " 'bond_features_size': 0,\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'classification',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=1),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 49,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': None,\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': True,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 1,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'binary_cross_entropy',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'prc-auc',\n",
      " 'metrics': ['prc-auc'],\n",
      " 'minimize_score': False,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_features_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_features_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_features_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': False,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "2385it [00:00, 371763.60it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 342711.81it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 158111.76it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "1190it [00:00, 470736.75it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 207595.63it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 140025.86it/s]\n",
      "1190it [00:00, 484772.90it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 354062.69it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 186545.89it/s]\n",
      "Class sizes\n",
      "targets 0: 29.39%, 1: 70.61%\n",
      "Total size = 2,385 | train size = 2,385 | val size = 1,190 | test size = 1,190\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (sigmoid): Sigmoid()\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout_layer): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (ffn): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=3600, out_features=600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.7, inplace=False)\n",
      "    (4): Linear(in_features=600, out_features=600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.7, inplace=False)\n",
      "    (7): Linear(in_features=600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 29,457,001\n",
      "Moving model to cuda\n",
      "  0%|          | 0/49 [00:00<?, ?it/s]Epoch 0\n",
      "Loss = 1.0067e+00, PNorm = 95.8215, GNorm = 11.3097, lr_0 = 2.0532e-04\n",
      "Loss = 8.2540e-01, PNorm = 95.8920, GNorm = 4.7372, lr_0 = 3.0106e-04\n",
      "Loss = 6.7640e-01, PNorm = 95.9742, GNorm = 3.5823, lr_0 = 3.9681e-04\n",
      "Loss = 6.1312e-01, PNorm = 96.0487, GNorm = 2.5055, lr_0 = 4.9255e-04\n",
      "Validation prc-auc = 0.615862\n",
      "  2%|▏         | 1/49 [00:11<08:52, 11.10s/it]Epoch 1\n",
      "Loss = 6.1991e-01, PNorm = 96.1183, GNorm = 2.2756, lr_0 = 5.9787e-04\n",
      "Loss = 6.4763e-01, PNorm = 96.1786, GNorm = 2.1096, lr_0 = 6.9362e-04\n",
      "Loss = 6.4850e-01, PNorm = 96.2327, GNorm = 2.1754, lr_0 = 7.8936e-04\n",
      "Loss = 6.1910e-01, PNorm = 96.2873, GNorm = 1.6985, lr_0 = 8.8511e-04\n",
      "Loss = 6.2604e-01, PNorm = 96.3436, GNorm = 1.7381, lr_0 = 9.8085e-04\n",
      "Validation prc-auc = 0.629335\n",
      "  4%|▍         | 2/49 [00:22<08:42, 11.11s/it]Epoch 2\n",
      "Loss = 6.2445e-01, PNorm = 96.4006, GNorm = 1.5906, lr_0 = 9.9170e-04\n",
      "Loss = 6.0673e-01, PNorm = 96.4588, GNorm = 1.5449, lr_0 = 9.8141e-04\n",
      "Loss = 6.5753e-01, PNorm = 96.5077, GNorm = 1.1993, lr_0 = 9.7124e-04\n",
      "Loss = 6.1372e-01, PNorm = 96.5569, GNorm = 1.1501, lr_0 = 9.6116e-04\n",
      "Loss = 5.8741e-01, PNorm = 96.5987, GNorm = 1.5248, lr_0 = 9.5120e-04\n",
      "Validation prc-auc = 0.635690\n",
      "  6%|▌         | 3/49 [00:33<08:31, 11.12s/it]Epoch 3\n",
      "Loss = 6.1903e-01, PNorm = 96.6363, GNorm = 1.1153, lr_0 = 9.4133e-04\n",
      "Loss = 5.9095e-01, PNorm = 96.6750, GNorm = 1.1666, lr_0 = 9.3157e-04\n",
      "Loss = 6.3447e-01, PNorm = 96.7094, GNorm = 1.1577, lr_0 = 9.2191e-04\n",
      "Loss = 6.0546e-01, PNorm = 96.7454, GNorm = 1.1495, lr_0 = 9.1235e-04\n",
      "Loss = 6.1925e-01, PNorm = 96.7774, GNorm = 1.0267, lr_0 = 9.0289e-04\n",
      "Loss = 5.3680e-01, PNorm = 96.7807, GNorm = 1.1632, lr_0 = 9.0195e-04\n",
      "Validation prc-auc = 0.641041\n",
      "  8%|▊         | 4/49 [00:44<08:27, 11.29s/it]Epoch 4\n",
      "Loss = 6.1236e-01, PNorm = 96.8128, GNorm = 0.9591, lr_0 = 8.9260e-04\n",
      "Loss = 5.9317e-01, PNorm = 96.8448, GNorm = 1.0099, lr_0 = 8.8334e-04\n",
      "Loss = 5.9902e-01, PNorm = 96.8771, GNorm = 1.0602, lr_0 = 8.7418e-04\n",
      "Loss = 6.0361e-01, PNorm = 96.9112, GNorm = 1.0944, lr_0 = 8.6512e-04\n",
      "Validation prc-auc = 0.660186\n",
      " 10%|█         | 5/49 [00:56<08:21, 11.39s/it]Epoch 5\n",
      "Loss = 5.9755e-01, PNorm = 96.9443, GNorm = 0.9007, lr_0 = 8.5615e-04\n",
      "Loss = 6.1481e-01, PNorm = 96.9818, GNorm = 0.9244, lr_0 = 8.4727e-04\n",
      "Loss = 5.8683e-01, PNorm = 97.0160, GNorm = 1.0581, lr_0 = 8.3848e-04\n",
      "Loss = 6.0921e-01, PNorm = 97.0481, GNorm = 1.1509, lr_0 = 8.2979e-04\n",
      "Loss = 5.9022e-01, PNorm = 97.0812, GNorm = 1.1127, lr_0 = 8.2118e-04\n",
      "Validation prc-auc = 0.651851\n",
      " 12%|█▏        | 6/49 [01:08<08:13, 11.47s/it]Epoch 6\n",
      "Loss = 5.7595e-01, PNorm = 97.1133, GNorm = 0.9377, lr_0 = 8.1267e-04\n",
      "Loss = 6.1230e-01, PNorm = 97.1476, GNorm = 1.0435, lr_0 = 8.0424e-04\n",
      "Loss = 6.2784e-01, PNorm = 97.1783, GNorm = 0.8401, lr_0 = 7.9590e-04\n",
      "Loss = 5.8118e-01, PNorm = 97.2112, GNorm = 1.2101, lr_0 = 7.8765e-04\n",
      "Loss = 5.9307e-01, PNorm = 97.2455, GNorm = 0.8913, lr_0 = 7.7948e-04\n",
      "Validation prc-auc = 0.655969\n",
      " 14%|█▍        | 7/49 [01:19<08:05, 11.55s/it]Epoch 7\n",
      "Loss = 6.4780e-01, PNorm = 97.2792, GNorm = 1.0028, lr_0 = 7.7060e-04\n",
      "Loss = 6.0253e-01, PNorm = 97.3069, GNorm = 0.7932, lr_0 = 7.6261e-04\n",
      "Loss = 5.9209e-01, PNorm = 97.3315, GNorm = 1.2744, lr_0 = 7.5470e-04\n",
      "Loss = 5.9137e-01, PNorm = 97.3523, GNorm = 0.8005, lr_0 = 7.4687e-04\n",
      "Loss = 6.1059e-01, PNorm = 97.3749, GNorm = 0.8399, lr_0 = 7.3913e-04\n",
      "Validation prc-auc = 0.664513\n",
      " 16%|█▋        | 8/49 [01:31<07:57, 11.65s/it]Epoch 8\n",
      "Loss = 5.5741e-01, PNorm = 97.3986, GNorm = 0.8739, lr_0 = 7.3146e-04\n",
      "Loss = 6.2573e-01, PNorm = 97.4220, GNorm = 0.7532, lr_0 = 7.2388e-04\n",
      "Loss = 5.9088e-01, PNorm = 97.4468, GNorm = 1.2770, lr_0 = 7.1637e-04\n",
      "Loss = 5.9256e-01, PNorm = 97.4694, GNorm = 0.7629, lr_0 = 7.0894e-04\n",
      "Validation prc-auc = 0.672864\n",
      " 18%|█▊        | 9/49 [01:43<07:51, 11.79s/it]Epoch 9\n",
      "Loss = 6.5881e-01, PNorm = 97.4916, GNorm = 0.8419, lr_0 = 7.0159e-04\n",
      "Loss = 5.8727e-01, PNorm = 97.5139, GNorm = 0.7291, lr_0 = 6.9432e-04\n",
      "Loss = 5.8728e-01, PNorm = 97.5374, GNorm = 1.0385, lr_0 = 6.8712e-04\n",
      "Loss = 5.8502e-01, PNorm = 97.5633, GNorm = 1.0428, lr_0 = 6.7999e-04\n",
      "Loss = 6.2082e-01, PNorm = 97.5899, GNorm = 0.7921, lr_0 = 6.7294e-04\n",
      "Validation prc-auc = 0.673715\n",
      " 20%|██        | 10/49 [01:55<07:41, 11.83s/it]Epoch 10\n",
      "Loss = 5.7459e-01, PNorm = 97.6175, GNorm = 1.3166, lr_0 = 6.6596e-04\n",
      "Loss = 5.6504e-01, PNorm = 97.6417, GNorm = 0.7604, lr_0 = 6.5906e-04\n",
      "Loss = 5.5505e-01, PNorm = 97.6662, GNorm = 0.7163, lr_0 = 6.5222e-04\n",
      "Loss = 5.8819e-01, PNorm = 97.6906, GNorm = 1.0963, lr_0 = 6.4546e-04\n",
      "Loss = 5.9150e-01, PNorm = 97.7150, GNorm = 0.7214, lr_0 = 6.3877e-04\n",
      "Validation prc-auc = 0.688644\n",
      " 22%|██▏       | 11/49 [02:07<07:30, 11.87s/it]Epoch 11\n",
      "Loss = 5.8862e-01, PNorm = 97.7485, GNorm = 0.7999, lr_0 = 6.3148e-04\n",
      "Loss = 5.8824e-01, PNorm = 97.7823, GNorm = 0.8205, lr_0 = 6.2494e-04\n",
      "Loss = 5.3623e-01, PNorm = 97.8175, GNorm = 0.8394, lr_0 = 6.1846e-04\n",
      "Loss = 5.8235e-01, PNorm = 97.8538, GNorm = 0.7945, lr_0 = 6.1204e-04\n",
      "Loss = 5.7764e-01, PNorm = 97.8898, GNorm = 0.8961, lr_0 = 6.0570e-04\n",
      "Validation prc-auc = 0.679210\n",
      " 24%|██▍       | 12/49 [02:19<07:19, 11.87s/it]Epoch 12\n",
      "Loss = 5.7526e-01, PNorm = 97.9272, GNorm = 0.8109, lr_0 = 5.9941e-04\n",
      "Loss = 5.9038e-01, PNorm = 97.9731, GNorm = 1.1532, lr_0 = 5.9320e-04\n",
      "Loss = 5.5518e-01, PNorm = 98.0209, GNorm = 0.8471, lr_0 = 5.8705e-04\n",
      "Loss = 5.5728e-01, PNorm = 98.0601, GNorm = 0.8460, lr_0 = 5.8096e-04\n",
      "Loss = 5.5681e-01, PNorm = 98.0981, GNorm = 0.8468, lr_0 = 5.7494e-04\n",
      "Validation prc-auc = 0.688309\n",
      " 27%|██▋       | 13/49 [02:31<07:08, 11.89s/it]Epoch 13\n",
      "Loss = 5.6598e-01, PNorm = 98.1387, GNorm = 0.8266, lr_0 = 5.6897e-04\n",
      "Loss = 5.3870e-01, PNorm = 98.1848, GNorm = 0.9767, lr_0 = 5.6307e-04\n",
      "Loss = 5.4043e-01, PNorm = 98.2379, GNorm = 1.1197, lr_0 = 5.5724e-04\n",
      "Loss = 5.4619e-01, PNorm = 98.2980, GNorm = 0.8256, lr_0 = 5.5146e-04\n",
      "Validation prc-auc = 0.699077\n",
      " 29%|██▊       | 14/49 [02:43<06:58, 11.96s/it]Epoch 14\n",
      "Loss = 5.3569e-01, PNorm = 98.3714, GNorm = 0.8903, lr_0 = 5.4517e-04\n",
      "Loss = 5.6463e-01, PNorm = 98.4409, GNorm = 1.2626, lr_0 = 5.3952e-04\n",
      "Loss = 5.4523e-01, PNorm = 98.5052, GNorm = 1.1145, lr_0 = 5.3392e-04\n",
      "Loss = 5.6643e-01, PNorm = 98.5639, GNorm = 0.9076, lr_0 = 5.2839e-04\n",
      "Loss = 5.5523e-01, PNorm = 98.6153, GNorm = 0.7693, lr_0 = 5.2291e-04\n",
      "Validation prc-auc = 0.691737\n",
      " 31%|███       | 15/49 [02:55<06:47, 11.98s/it]Epoch 15\n",
      "Loss = 5.3118e-01, PNorm = 98.6636, GNorm = 0.9687, lr_0 = 5.1748e-04\n",
      "Loss = 5.3933e-01, PNorm = 98.7119, GNorm = 0.8625, lr_0 = 5.1212e-04\n",
      "Loss = 5.4049e-01, PNorm = 98.7619, GNorm = 0.8584, lr_0 = 5.0681e-04\n",
      "Loss = 5.4891e-01, PNorm = 98.8204, GNorm = 0.8701, lr_0 = 5.0155e-04\n",
      "Loss = 6.0999e-01, PNorm = 98.8840, GNorm = 1.5771, lr_0 = 4.9635e-04\n",
      "Validation prc-auc = 0.698665\n",
      " 33%|███▎      | 16/49 [03:07<06:37, 12.05s/it]Epoch 16\n",
      "Loss = 5.5149e-01, PNorm = 98.9355, GNorm = 0.8400, lr_0 = 4.9121e-04\n",
      "Loss = 5.6923e-01, PNorm = 98.9801, GNorm = 0.8205, lr_0 = 4.8611e-04\n",
      "Loss = 5.0741e-01, PNorm = 99.0231, GNorm = 0.9529, lr_0 = 4.8107e-04\n",
      "Loss = 5.1714e-01, PNorm = 99.0660, GNorm = 1.3596, lr_0 = 4.7608e-04\n",
      "Loss = 5.4610e-01, PNorm = 99.1139, GNorm = 1.2540, lr_0 = 4.7115e-04\n",
      "Loss = 5.4559e-01, PNorm = 99.1190, GNorm = 1.1154, lr_0 = 4.7065e-04\n",
      "Validation prc-auc = 0.703012\n",
      " 35%|███▍      | 17/49 [03:20<06:27, 12.09s/it]Epoch 17\n",
      "Loss = 5.6096e-01, PNorm = 99.1730, GNorm = 0.8506, lr_0 = 4.6577e-04\n",
      "Loss = 4.6652e-01, PNorm = 99.2311, GNorm = 1.2833, lr_0 = 4.6094e-04\n",
      "Loss = 5.7133e-01, PNorm = 99.2952, GNorm = 1.4062, lr_0 = 4.5616e-04\n",
      "Loss = 5.1146e-01, PNorm = 99.3744, GNorm = 0.9661, lr_0 = 4.5143e-04\n",
      "Validation prc-auc = 0.702302\n",
      " 37%|███▋      | 18/49 [03:32<06:14, 12.07s/it]Epoch 18\n",
      "Loss = 4.5711e-01, PNorm = 99.4486, GNorm = 0.8978, lr_0 = 4.4675e-04\n",
      "Loss = 5.1450e-01, PNorm = 99.5158, GNorm = 1.0773, lr_0 = 4.4212e-04\n",
      "Loss = 5.4205e-01, PNorm = 99.5852, GNorm = 0.9560, lr_0 = 4.3754e-04\n",
      "Loss = 5.7246e-01, PNorm = 99.6483, GNorm = 1.1926, lr_0 = 4.3300e-04\n",
      "Loss = 4.6836e-01, PNorm = 99.7024, GNorm = 0.8893, lr_0 = 4.2851e-04\n",
      "Validation prc-auc = 0.715082\n",
      " 39%|███▉      | 19/49 [03:44<06:03, 12.12s/it]Epoch 19\n",
      "Loss = 4.8704e-01, PNorm = 99.7477, GNorm = 0.8783, lr_0 = 4.2407e-04\n",
      "Loss = 4.9577e-01, PNorm = 99.7995, GNorm = 1.4950, lr_0 = 4.1967e-04\n",
      "Loss = 5.3146e-01, PNorm = 99.8667, GNorm = 1.1820, lr_0 = 4.1532e-04\n",
      "Loss = 5.1071e-01, PNorm = 99.9379, GNorm = 1.1795, lr_0 = 4.1101e-04\n",
      "Loss = 5.0250e-01, PNorm = 100.0001, GNorm = 1.0708, lr_0 = 4.0675e-04\n",
      "Validation prc-auc = 0.713267\n",
      " 41%|████      | 20/49 [03:56<05:51, 12.12s/it]Epoch 20\n",
      "Loss = 5.1530e-01, PNorm = 100.0550, GNorm = 2.5589, lr_0 = 4.0253e-04\n",
      "Loss = 4.7558e-01, PNorm = 100.1062, GNorm = 0.8899, lr_0 = 3.9836e-04\n",
      "Loss = 5.1477e-01, PNorm = 100.1580, GNorm = 1.3610, lr_0 = 3.9423e-04\n",
      "Loss = 4.8478e-01, PNorm = 100.2147, GNorm = 0.9908, lr_0 = 3.9014e-04\n",
      "Loss = 5.1785e-01, PNorm = 100.2678, GNorm = 1.3075, lr_0 = 3.8609e-04\n",
      "Validation prc-auc = 0.697765\n",
      " 43%|████▎     | 21/49 [04:08<05:42, 12.23s/it]Epoch 21\n",
      "Loss = 4.8804e-01, PNorm = 100.3286, GNorm = 1.9389, lr_0 = 3.8169e-04\n",
      "Loss = 4.4829e-01, PNorm = 100.3923, GNorm = 0.9990, lr_0 = 3.7773e-04\n",
      "Loss = 5.3973e-01, PNorm = 100.4597, GNorm = 1.1261, lr_0 = 3.7382e-04\n",
      "Loss = 4.5359e-01, PNorm = 100.5230, GNorm = 1.4720, lr_0 = 3.6994e-04\n",
      "Validation prc-auc = 0.730478\n",
      " 45%|████▍     | 22/49 [04:21<05:30, 12.25s/it]Epoch 22\n",
      "Loss = 5.0334e-01, PNorm = 100.5881, GNorm = 1.4204, lr_0 = 3.6610e-04\n",
      "Loss = 5.2330e-01, PNorm = 100.6420, GNorm = 1.1426, lr_0 = 3.6231e-04\n",
      "Loss = 4.4600e-01, PNorm = 100.6945, GNorm = 1.3572, lr_0 = 3.5855e-04\n",
      "Loss = 4.6355e-01, PNorm = 100.7440, GNorm = 1.0567, lr_0 = 3.5483e-04\n",
      "Loss = 5.2424e-01, PNorm = 100.7986, GNorm = 1.2341, lr_0 = 3.5115e-04\n",
      "Validation prc-auc = 0.710172\n",
      " 47%|████▋     | 23/49 [04:33<05:17, 12.22s/it]Epoch 23\n",
      "Loss = 4.8506e-01, PNorm = 100.8470, GNorm = 1.5420, lr_0 = 3.4751e-04\n",
      "Loss = 4.8682e-01, PNorm = 100.8904, GNorm = 0.9928, lr_0 = 3.4391e-04\n",
      "Loss = 4.5869e-01, PNorm = 100.9296, GNorm = 2.0953, lr_0 = 3.4034e-04\n",
      "Loss = 5.0980e-01, PNorm = 100.9674, GNorm = 1.1891, lr_0 = 3.3681e-04\n",
      "Loss = 4.5286e-01, PNorm = 101.0165, GNorm = 0.9336, lr_0 = 3.3332e-04\n",
      "Validation prc-auc = 0.728259\n",
      " 49%|████▉     | 24/49 [04:45<05:04, 12.19s/it]Epoch 24\n",
      "Loss = 4.8516e-01, PNorm = 101.0666, GNorm = 1.8970, lr_0 = 3.2952e-04\n",
      "Loss = 4.8621e-01, PNorm = 101.1131, GNorm = 1.4264, lr_0 = 3.2610e-04\n",
      "Loss = 4.3167e-01, PNorm = 101.1564, GNorm = 1.1878, lr_0 = 3.2272e-04\n",
      "Loss = 4.2437e-01, PNorm = 101.2023, GNorm = 2.7617, lr_0 = 3.1937e-04\n",
      "Loss = 4.8904e-01, PNorm = 101.2491, GNorm = 1.7485, lr_0 = 3.1606e-04\n",
      "Validation prc-auc = 0.733935\n",
      " 51%|█████     | 25/49 [04:57<04:53, 12.23s/it]Epoch 25\n",
      "Loss = 5.2475e-01, PNorm = 101.2964, GNorm = 2.3993, lr_0 = 3.1279e-04\n",
      "Loss = 4.6621e-01, PNorm = 101.3451, GNorm = 1.2041, lr_0 = 3.0954e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.3867, GNorm = 1.1062, lr_0 = 3.0633e-04\n",
      "Loss = 4.7162e-01, PNorm = 101.4270, GNorm = 1.3346, lr_0 = 3.0316e-04\n",
      "Loss = 4.3106e-01, PNorm = 101.4674, GNorm = 1.6084, lr_0 = 3.0001e-04\n",
      "Validation prc-auc = 0.729222\n",
      " 53%|█████▎    | 26/49 [05:09<04:40, 12.20s/it]Epoch 26\n",
      "Loss = 4.3461e-01, PNorm = 101.5064, GNorm = 1.1614, lr_0 = 2.9690e-04\n",
      "Loss = 4.8308e-01, PNorm = 101.5477, GNorm = 2.9387, lr_0 = 2.9382e-04\n",
      "Loss = 4.4844e-01, PNorm = 101.5879, GNorm = 1.3525, lr_0 = 2.9078e-04\n",
      "Loss = 4.5905e-01, PNorm = 101.6276, GNorm = 1.7554, lr_0 = 2.8776e-04\n",
      "Validation prc-auc = 0.723556\n",
      " 55%|█████▌    | 27/49 [05:22<04:30, 12.28s/it]Epoch 27\n",
      "Loss = 3.8075e-01, PNorm = 101.6739, GNorm = 1.2324, lr_0 = 2.8448e-04\n",
      "Loss = 4.4958e-01, PNorm = 101.7146, GNorm = 1.6542, lr_0 = 2.8153e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.7589, GNorm = 1.4257, lr_0 = 2.7861e-04\n",
      "Loss = 4.2466e-01, PNorm = 101.8007, GNorm = 1.7038, lr_0 = 2.7572e-04\n",
      "Loss = 4.7970e-01, PNorm = 101.8378, GNorm = 1.3090, lr_0 = 2.7286e-04\n",
      "Validation prc-auc = 0.707338\n",
      " 57%|█████▋    | 28/49 [05:34<04:17, 12.25s/it]Epoch 28\n",
      "Loss = 4.5278e-01, PNorm = 101.8740, GNorm = 1.3734, lr_0 = 2.7003e-04\n",
      "Loss = 4.5094e-01, PNorm = 101.9079, GNorm = 1.0547, lr_0 = 2.6723e-04\n",
      "Loss = 4.1357e-01, PNorm = 101.9411, GNorm = 1.5816, lr_0 = 2.6446e-04\n",
      "Loss = 4.6498e-01, PNorm = 101.9734, GNorm = 1.8609, lr_0 = 2.6172e-04\n",
      "Loss = 4.2933e-01, PNorm = 102.0062, GNorm = 1.0863, lr_0 = 2.5901e-04\n",
      "Validation prc-auc = 0.699879\n",
      " 59%|█████▉    | 29/49 [05:46<04:04, 12.22s/it]Epoch 29\n",
      "Loss = 3.9687e-01, PNorm = 102.0364, GNorm = 1.0911, lr_0 = 2.5632e-04\n",
      "Loss = 3.9953e-01, PNorm = 102.0640, GNorm = 1.2628, lr_0 = 2.5366e-04\n",
      "Loss = 4.5717e-01, PNorm = 102.0935, GNorm = 1.8129, lr_0 = 2.5103e-04\n",
      "Loss = 4.1537e-01, PNorm = 102.1263, GNorm = 1.2622, lr_0 = 2.4843e-04\n",
      "Loss = 4.6298e-01, PNorm = 102.1587, GNorm = 1.6679, lr_0 = 2.4585e-04\n",
      "Validation prc-auc = 0.729581\n",
      " 61%|██████    | 30/49 [05:58<03:52, 12.22s/it]Epoch 30\n",
      "Loss = 4.4116e-01, PNorm = 102.1918, GNorm = 2.3824, lr_0 = 2.4330e-04\n",
      "Loss = 4.4225e-01, PNorm = 102.2200, GNorm = 2.0057, lr_0 = 2.4078e-04\n",
      "Loss = 4.1512e-01, PNorm = 102.2495, GNorm = 1.2579, lr_0 = 2.3828e-04\n",
      "Loss = 4.3965e-01, PNorm = 102.2783, GNorm = 1.9444, lr_0 = 2.3581e-04\n",
      "Validation prc-auc = 0.721862\n",
      " 63%|██████▎   | 31/49 [06:11<03:39, 12.21s/it]Epoch 31\n",
      "Loss = 4.1521e-01, PNorm = 102.3138, GNorm = 2.0351, lr_0 = 2.3312e-04\n",
      "Loss = 4.6530e-01, PNorm = 102.3409, GNorm = 0.9553, lr_0 = 2.3071e-04\n",
      "Loss = 4.4350e-01, PNorm = 102.3687, GNorm = 1.5819, lr_0 = 2.2831e-04\n",
      "Loss = 4.1122e-01, PNorm = 102.3959, GNorm = 1.5397, lr_0 = 2.2595e-04\n",
      "Loss = 3.9777e-01, PNorm = 102.4228, GNorm = 0.9937, lr_0 = 2.2360e-04\n",
      "Validation prc-auc = 0.721970\n",
      " 65%|██████▌   | 32/49 [06:23<03:29, 12.35s/it]Epoch 32\n",
      "Loss = 4.3843e-01, PNorm = 102.4485, GNorm = 3.1887, lr_0 = 2.2129e-04\n",
      "Loss = 3.8235e-01, PNorm = 102.4765, GNorm = 1.1239, lr_0 = 2.1899e-04\n",
      "Loss = 4.2292e-01, PNorm = 102.5009, GNorm = 1.9876, lr_0 = 2.1672e-04\n",
      "Loss = 4.3276e-01, PNorm = 102.5277, GNorm = 1.5407, lr_0 = 2.1447e-04\n",
      "Loss = 4.6404e-01, PNorm = 102.5524, GNorm = 1.9581, lr_0 = 2.1225e-04\n",
      "Validation prc-auc = 0.704753\n",
      " 67%|██████▋   | 33/49 [06:36<03:16, 12.31s/it]Epoch 33\n",
      "Loss = 4.0377e-01, PNorm = 102.5779, GNorm = 1.4487, lr_0 = 2.1005e-04\n",
      "Loss = 4.3812e-01, PNorm = 102.6001, GNorm = 1.7061, lr_0 = 2.0787e-04\n",
      "Loss = 4.1834e-01, PNorm = 102.6218, GNorm = 1.3299, lr_0 = 2.0571e-04\n",
      "Loss = 4.0906e-01, PNorm = 102.6444, GNorm = 1.2884, lr_0 = 2.0358e-04\n",
      "Loss = 4.0979e-01, PNorm = 102.6662, GNorm = 1.7456, lr_0 = 2.0147e-04\n",
      "Validation prc-auc = 0.741242\n",
      " 69%|██████▉   | 34/49 [06:48<03:05, 12.36s/it]Epoch 34\n",
      "Loss = 4.2813e-01, PNorm = 102.6889, GNorm = 2.0504, lr_0 = 1.9917e-04\n",
      "Loss = 4.2911e-01, PNorm = 102.7107, GNorm = 2.0385, lr_0 = 1.9711e-04\n",
      "Loss = 4.0048e-01, PNorm = 102.7322, GNorm = 1.4560, lr_0 = 1.9506e-04\n",
      "Loss = 3.9704e-01, PNorm = 102.7581, GNorm = 1.1820, lr_0 = 1.9304e-04\n",
      "Validation prc-auc = 0.727587\n",
      " 71%|███████▏  | 35/49 [07:00<02:52, 12.30s/it]Epoch 35\n",
      "Loss = 3.3330e-01, PNorm = 102.7780, GNorm = 1.1825, lr_0 = 1.9104e-04\n",
      "Loss = 3.8412e-01, PNorm = 102.7992, GNorm = 1.7658, lr_0 = 1.8906e-04\n",
      "Loss = 3.7517e-01, PNorm = 102.8210, GNorm = 1.2284, lr_0 = 1.8710e-04\n",
      "Loss = 4.5571e-01, PNorm = 102.8433, GNorm = 2.2784, lr_0 = 1.8516e-04\n",
      "Loss = 3.8375e-01, PNorm = 102.8635, GNorm = 1.3376, lr_0 = 1.8324e-04\n",
      "Validation prc-auc = 0.724475\n",
      " 73%|███████▎  | 36/49 [07:12<02:39, 12.28s/it]Epoch 36\n",
      "Loss = 4.4192e-01, PNorm = 102.8839, GNorm = 1.9883, lr_0 = 1.8134e-04\n",
      "Loss = 3.9549e-01, PNorm = 102.9023, GNorm = 1.8302, lr_0 = 1.7946e-04\n",
      "Loss = 3.7269e-01, PNorm = 102.9189, GNorm = 1.2762, lr_0 = 1.7760e-04\n",
      "Loss = 4.3072e-01, PNorm = 102.9375, GNorm = 1.6168, lr_0 = 1.7575e-04\n",
      "Loss = 4.1462e-01, PNorm = 102.9576, GNorm = 1.4891, lr_0 = 1.7393e-04\n",
      "Validation prc-auc = 0.729879\n",
      " 76%|███████▌  | 37/49 [07:25<02:27, 12.28s/it]Epoch 37\n",
      "Loss = 3.9510e-01, PNorm = 102.9784, GNorm = 1.6406, lr_0 = 1.7195e-04\n",
      "Loss = 3.8523e-01, PNorm = 102.9971, GNorm = 3.6376, lr_0 = 1.7017e-04\n",
      "Loss = 4.0788e-01, PNorm = 103.0164, GNorm = 1.6742, lr_0 = 1.6840e-04\n",
      "Loss = 3.9008e-01, PNorm = 103.0370, GNorm = 1.3618, lr_0 = 1.6666e-04\n",
      "Loss = 3.6996e-01, PNorm = 103.0561, GNorm = 2.1714, lr_0 = 1.6493e-04\n",
      "Validation prc-auc = 0.732890\n",
      " 78%|███████▊  | 38/49 [07:37<02:16, 12.37s/it]Epoch 38\n",
      "Loss = 4.2739e-01, PNorm = 103.0759, GNorm = 2.0150, lr_0 = 1.6322e-04\n",
      "Loss = 3.7266e-01, PNorm = 103.0961, GNorm = 1.5987, lr_0 = 1.6152e-04\n",
      "Loss = 4.0328e-01, PNorm = 103.1141, GNorm = 1.2749, lr_0 = 1.5985e-04\n",
      "Loss = 4.0170e-01, PNorm = 103.1329, GNorm = 1.6032, lr_0 = 1.5819e-04\n",
      "Loss = 3.5034e-01, PNorm = 103.1500, GNorm = 1.2491, lr_0 = 1.5655e-04\n",
      "Validation prc-auc = 0.730448\n",
      " 80%|███████▉  | 39/49 [07:50<02:03, 12.36s/it]Epoch 39\n",
      "Loss = 4.0423e-01, PNorm = 103.1649, GNorm = 3.4590, lr_0 = 1.5493e-04\n",
      "Loss = 4.0749e-01, PNorm = 103.1823, GNorm = 2.6038, lr_0 = 1.5332e-04\n",
      "Loss = 3.7462e-01, PNorm = 103.1983, GNorm = 1.7902, lr_0 = 1.5173e-04\n",
      "Loss = 3.6832e-01, PNorm = 103.2140, GNorm = 2.0638, lr_0 = 1.5016e-04\n",
      "Validation prc-auc = 0.726064\n",
      " 82%|████████▏ | 40/49 [08:02<01:50, 12.33s/it]Epoch 40\n",
      "Loss = 3.8487e-01, PNorm = 103.2275, GNorm = 1.6070, lr_0 = 1.4860e-04\n",
      "Loss = 3.5290e-01, PNorm = 103.2421, GNorm = 2.4138, lr_0 = 1.4706e-04\n",
      "Loss = 4.0514e-01, PNorm = 103.2566, GNorm = 1.1793, lr_0 = 1.4554e-04\n",
      "Loss = 3.6971e-01, PNorm = 103.2715, GNorm = 1.2253, lr_0 = 1.4403e-04\n",
      "Loss = 4.0549e-01, PNorm = 103.2859, GNorm = 1.1838, lr_0 = 1.4253e-04\n",
      "Validation prc-auc = 0.728744\n",
      " 84%|████████▎ | 41/49 [08:14<01:38, 12.30s/it]Epoch 41\n",
      "Loss = 4.0692e-01, PNorm = 103.3017, GNorm = 2.3294, lr_0 = 1.4091e-04\n",
      "Loss = 3.6107e-01, PNorm = 103.3157, GNorm = 1.8161, lr_0 = 1.3945e-04\n",
      "Loss = 4.3158e-01, PNorm = 103.3296, GNorm = 2.0411, lr_0 = 1.3800e-04\n",
      "Loss = 3.8727e-01, PNorm = 103.3434, GNorm = 2.1048, lr_0 = 1.3657e-04\n",
      "Loss = 3.5917e-01, PNorm = 103.3583, GNorm = 0.9664, lr_0 = 1.3515e-04\n",
      "Validation prc-auc = 0.727437\n",
      " 86%|████████▌ | 42/49 [08:26<01:26, 12.30s/it]Epoch 42\n",
      "Loss = 4.1430e-01, PNorm = 103.3714, GNorm = 2.0484, lr_0 = 1.3375e-04\n",
      "Loss = 3.7543e-01, PNorm = 103.3872, GNorm = 2.0368, lr_0 = 1.3237e-04\n",
      "Loss = 4.2834e-01, PNorm = 103.4001, GNorm = 1.5786, lr_0 = 1.3099e-04\n",
      "Loss = 3.5447e-01, PNorm = 103.4133, GNorm = 1.7577, lr_0 = 1.2963e-04\n",
      "Loss = 3.9995e-01, PNorm = 103.4242, GNorm = 1.9164, lr_0 = 1.2829e-04\n",
      "Validation prc-auc = 0.734144\n",
      " 88%|████████▊ | 43/49 [08:39<01:14, 12.39s/it]Epoch 43\n",
      "Loss = 3.3649e-01, PNorm = 103.4355, GNorm = 1.3637, lr_0 = 1.2696e-04\n",
      "Loss = 3.6927e-01, PNorm = 103.4467, GNorm = 2.3235, lr_0 = 1.2564e-04\n",
      "Loss = 3.8944e-01, PNorm = 103.4571, GNorm = 1.8026, lr_0 = 1.2434e-04\n",
      "Loss = 3.8420e-01, PNorm = 103.4687, GNorm = 1.6287, lr_0 = 1.2305e-04\n",
      "Validation prc-auc = 0.731557\n",
      " 90%|████████▉ | 44/49 [08:51<01:01, 12.34s/it]Epoch 44\n",
      "Loss = 3.5538e-01, PNorm = 103.4799, GNorm = 2.2236, lr_0 = 1.2165e-04\n",
      "Loss = 3.3368e-01, PNorm = 103.4906, GNorm = 2.1795, lr_0 = 1.2039e-04\n",
      "Loss = 3.9180e-01, PNorm = 103.4997, GNorm = 2.1030, lr_0 = 1.1914e-04\n",
      "Loss = 3.5748e-01, PNorm = 103.5107, GNorm = 1.3978, lr_0 = 1.1790e-04\n",
      "Loss = 3.7379e-01, PNorm = 103.5203, GNorm = 1.9116, lr_0 = 1.1668e-04\n",
      "Validation prc-auc = 0.722937\n",
      " 92%|█████████▏| 45/49 [09:03<00:49, 12.33s/it]Epoch 45\n",
      "Loss = 3.6534e-01, PNorm = 103.5314, GNorm = 2.0698, lr_0 = 1.1547e-04\n",
      "Loss = 3.5860e-01, PNorm = 103.5417, GNorm = 2.5266, lr_0 = 1.1427e-04\n",
      "Loss = 3.4249e-01, PNorm = 103.5502, GNorm = 2.0074, lr_0 = 1.1309e-04\n",
      "Loss = 3.8670e-01, PNorm = 103.5614, GNorm = 2.2272, lr_0 = 1.1192e-04\n",
      "Loss = 4.4395e-01, PNorm = 103.5698, GNorm = 3.2936, lr_0 = 1.1076e-04\n",
      "Validation prc-auc = 0.731044\n",
      " 94%|█████████▍| 46/49 [09:16<00:37, 12.35s/it]Epoch 46\n",
      "Loss = 3.5897e-01, PNorm = 103.5800, GNorm = 1.6338, lr_0 = 1.0961e-04\n",
      "Loss = 3.2715e-01, PNorm = 103.5895, GNorm = 1.2976, lr_0 = 1.0847e-04\n",
      "Loss = 3.4290e-01, PNorm = 103.5986, GNorm = 1.9580, lr_0 = 1.0735e-04\n",
      "Loss = 3.4036e-01, PNorm = 103.6072, GNorm = 1.4277, lr_0 = 1.0623e-04\n",
      "Loss = 4.3518e-01, PNorm = 103.6140, GNorm = 2.1300, lr_0 = 1.0513e-04\n",
      "Validation prc-auc = 0.731099\n",
      " 96%|█████████▌| 47/49 [09:28<00:24, 12.32s/it]Epoch 47\n",
      "Loss = 3.6067e-01, PNorm = 103.6237, GNorm = 1.7237, lr_0 = 1.0393e-04\n",
      "Loss = 3.7243e-01, PNorm = 103.6312, GNorm = 1.5077, lr_0 = 1.0285e-04\n",
      "Loss = 3.9727e-01, PNorm = 103.6384, GNorm = 1.3241, lr_0 = 1.0179e-04\n",
      "Loss = 3.4225e-01, PNorm = 103.6475, GNorm = 0.9065, lr_0 = 1.0073e-04\n",
      "Validation prc-auc = 0.733490\n",
      " 98%|█████████▊| 48/49 [09:40<00:12, 12.31s/it]Epoch 48\n",
      "Loss = 3.6779e-01, PNorm = 103.6554, GNorm = 2.3459, lr_0 = 1.0000e-04\n",
      "Loss = 3.6082e-01, PNorm = 103.6636, GNorm = 1.3462, lr_0 = 1.0000e-04\n",
      "Loss = 3.7138e-01, PNorm = 103.6726, GNorm = 1.9617, lr_0 = 1.0000e-04\n",
      "Loss = 3.5044e-01, PNorm = 103.6815, GNorm = 1.5092, lr_0 = 1.0000e-04\n",
      "Loss = 3.6957e-01, PNorm = 103.6885, GNorm = 2.6978, lr_0 = 1.0000e-04\n",
      "Validation prc-auc = 0.733983\n",
      "100%|██████████| 49/49 [09:53<00:00, 12.11s/it]\n",
      "Model 0 best validation prc-auc = 0.741242 on epoch 33\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"ffn.1.weight\".\n",
      "Loading pretrained parameter \"ffn.1.bias\".\n",
      "Loading pretrained parameter \"ffn.4.weight\".\n",
      "Loading pretrained parameter \"ffn.4.bias\".\n",
      "Loading pretrained parameter \"ffn.7.weight\".\n",
      "Loading pretrained parameter \"ffn.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test prc-auc = 0.741242                \n",
      "Ensemble test prc-auc = 0.741242\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test prc-auc = 0.741242\n",
      "Overall test prc-auc = 0.741242 +/- 0.000000\n",
      "Elapsed time = 0:09:57\n",
      "Command line\n",
      "python /home/steshin/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"6c604d94-190d-4da2-9c36-788708df5377\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/steshin/.local/share/jupyter/runtime/kernel-v2-2822374BRuswu5zWdXq.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_feature_scaling': True,\n",
      " 'bond_features_path': None,\n",
      " 'bond_features_size': 0,\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'classification',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=1),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 49,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': None,\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': True,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 1,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'binary_cross_entropy',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'prc-auc',\n",
      " 'metrics': ['prc-auc'],\n",
      " 'minimize_score': False,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_features_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_features_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_features_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': False,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "2385it [00:00, 364316.96it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 325632.00it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 170189.78it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "1190it [00:00, 389878.28it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 316480.99it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 186497.10it/s]\n",
      "1190it [00:00, 382322.62it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 369200.51it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 189111.57it/s]\n",
      "Class sizes\n",
      "targets 0: 29.39%, 1: 70.61%\n",
      "Total size = 2,385 | train size = 2,385 | val size = 1,190 | test size = 1,190\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (sigmoid): Sigmoid()\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout_layer): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (ffn): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=3600, out_features=600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.7, inplace=False)\n",
      "    (4): Linear(in_features=600, out_features=600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.7, inplace=False)\n",
      "    (7): Linear(in_features=600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 29,457,001\n",
      "Moving model to cuda\n",
      "  0%|          | 0/49 [00:00<?, ?it/s]Epoch 0\n",
      "Loss = 1.0067e+00, PNorm = 95.8215, GNorm = 11.3097, lr_0 = 2.0532e-04\n",
      "Loss = 8.2540e-01, PNorm = 95.8920, GNorm = 4.7372, lr_0 = 3.0106e-04\n",
      "Loss = 6.7640e-01, PNorm = 95.9742, GNorm = 3.5823, lr_0 = 3.9681e-04\n",
      "Loss = 6.1312e-01, PNorm = 96.0487, GNorm = 2.5055, lr_0 = 4.9255e-04\n",
      "Validation prc-auc = 0.615862\n",
      "  2%|▏         | 1/49 [00:12<09:57, 12.44s/it]Epoch 1\n",
      "Loss = 6.1991e-01, PNorm = 96.1183, GNorm = 2.2756, lr_0 = 5.9787e-04\n",
      "Loss = 6.4763e-01, PNorm = 96.1786, GNorm = 2.1096, lr_0 = 6.9362e-04\n",
      "Loss = 6.4850e-01, PNorm = 96.2327, GNorm = 2.1754, lr_0 = 7.8936e-04\n",
      "Loss = 6.1910e-01, PNorm = 96.2873, GNorm = 1.6985, lr_0 = 8.8511e-04\n",
      "Loss = 6.2604e-01, PNorm = 96.3436, GNorm = 1.7381, lr_0 = 9.8085e-04\n",
      "Validation prc-auc = 0.629335\n",
      "  4%|▍         | 2/49 [00:24<09:46, 12.48s/it]Epoch 2\n",
      "Loss = 6.2445e-01, PNorm = 96.4006, GNorm = 1.5906, lr_0 = 9.9170e-04\n",
      "Loss = 6.0673e-01, PNorm = 96.4588, GNorm = 1.5449, lr_0 = 9.8141e-04\n",
      "Loss = 6.5753e-01, PNorm = 96.5077, GNorm = 1.1993, lr_0 = 9.7124e-04\n",
      "Loss = 6.1372e-01, PNorm = 96.5569, GNorm = 1.1501, lr_0 = 9.6116e-04\n",
      "Loss = 5.8741e-01, PNorm = 96.5987, GNorm = 1.5248, lr_0 = 9.5120e-04\n",
      "Validation prc-auc = 0.635690\n",
      "  6%|▌         | 3/49 [00:37<09:40, 12.61s/it]Epoch 3\n",
      "Loss = 6.1903e-01, PNorm = 96.6363, GNorm = 1.1153, lr_0 = 9.4133e-04\n",
      "Loss = 5.9095e-01, PNorm = 96.6750, GNorm = 1.1666, lr_0 = 9.3157e-04\n",
      "Loss = 6.3447e-01, PNorm = 96.7094, GNorm = 1.1577, lr_0 = 9.2191e-04\n",
      "Loss = 6.0546e-01, PNorm = 96.7454, GNorm = 1.1495, lr_0 = 9.1235e-04\n",
      "Loss = 6.1925e-01, PNorm = 96.7774, GNorm = 1.0267, lr_0 = 9.0289e-04\n",
      "Loss = 5.3680e-01, PNorm = 96.7807, GNorm = 1.1632, lr_0 = 9.0195e-04\n",
      "Validation prc-auc = 0.641041\n",
      "  8%|▊         | 4/49 [00:50<09:25, 12.57s/it]Epoch 4\n",
      "Loss = 6.1236e-01, PNorm = 96.8128, GNorm = 0.9591, lr_0 = 8.9260e-04\n",
      "Loss = 5.9317e-01, PNorm = 96.8448, GNorm = 1.0099, lr_0 = 8.8334e-04\n",
      "Loss = 5.9902e-01, PNorm = 96.8771, GNorm = 1.0602, lr_0 = 8.7418e-04\n",
      "Loss = 6.0361e-01, PNorm = 96.9112, GNorm = 1.0944, lr_0 = 8.6512e-04\n",
      "Validation prc-auc = 0.660186\n",
      " 10%|█         | 5/49 [01:02<09:10, 12.50s/it]Epoch 5\n",
      "Loss = 5.9755e-01, PNorm = 96.9443, GNorm = 0.9007, lr_0 = 8.5615e-04\n",
      "Loss = 6.1481e-01, PNorm = 96.9818, GNorm = 0.9244, lr_0 = 8.4727e-04\n",
      "Loss = 5.8683e-01, PNorm = 97.0160, GNorm = 1.0581, lr_0 = 8.3848e-04\n",
      "Loss = 6.0921e-01, PNorm = 97.0481, GNorm = 1.1509, lr_0 = 8.2979e-04\n",
      "Loss = 5.9022e-01, PNorm = 97.0812, GNorm = 1.1127, lr_0 = 8.2118e-04\n",
      "Validation prc-auc = 0.651851\n",
      " 12%|█▏        | 6/49 [01:14<08:54, 12.44s/it]Epoch 6\n",
      "Loss = 5.7595e-01, PNorm = 97.1133, GNorm = 0.9377, lr_0 = 8.1267e-04\n",
      "Loss = 6.1230e-01, PNorm = 97.1476, GNorm = 1.0435, lr_0 = 8.0424e-04\n",
      "Loss = 6.2784e-01, PNorm = 97.1783, GNorm = 0.8401, lr_0 = 7.9590e-04\n",
      "Loss = 5.8118e-01, PNorm = 97.2112, GNorm = 1.2101, lr_0 = 7.8765e-04\n",
      "Loss = 5.9307e-01, PNorm = 97.2455, GNorm = 0.8913, lr_0 = 7.7948e-04\n",
      "Validation prc-auc = 0.655969\n",
      " 14%|█▍        | 7/49 [01:27<08:40, 12.39s/it]Epoch 7\n",
      "Loss = 6.4780e-01, PNorm = 97.2792, GNorm = 1.0028, lr_0 = 7.7060e-04\n",
      "Loss = 6.0253e-01, PNorm = 97.3069, GNorm = 0.7932, lr_0 = 7.6261e-04\n",
      "Loss = 5.9209e-01, PNorm = 97.3315, GNorm = 1.2744, lr_0 = 7.5470e-04\n",
      "Loss = 5.9137e-01, PNorm = 97.3523, GNorm = 0.8005, lr_0 = 7.4687e-04\n",
      "Loss = 6.1059e-01, PNorm = 97.3749, GNorm = 0.8399, lr_0 = 7.3913e-04\n",
      "Validation prc-auc = 0.664513\n",
      " 16%|█▋        | 8/49 [01:39<08:31, 12.47s/it]Epoch 8\n",
      "Loss = 5.5741e-01, PNorm = 97.3986, GNorm = 0.8739, lr_0 = 7.3146e-04\n",
      "Loss = 6.2573e-01, PNorm = 97.4220, GNorm = 0.7532, lr_0 = 7.2388e-04\n",
      "Loss = 5.9088e-01, PNorm = 97.4468, GNorm = 1.2770, lr_0 = 7.1637e-04\n",
      "Loss = 5.9256e-01, PNorm = 97.4694, GNorm = 0.7629, lr_0 = 7.0894e-04\n",
      "Validation prc-auc = 0.672864\n",
      " 18%|█▊        | 9/49 [01:52<08:22, 12.57s/it]Epoch 9\n",
      "Loss = 6.5881e-01, PNorm = 97.4916, GNorm = 0.8419, lr_0 = 7.0159e-04\n",
      "Loss = 5.8727e-01, PNorm = 97.5139, GNorm = 0.7291, lr_0 = 6.9432e-04\n",
      "Loss = 5.8728e-01, PNorm = 97.5374, GNorm = 1.0385, lr_0 = 6.8712e-04\n",
      "Loss = 5.8502e-01, PNorm = 97.5633, GNorm = 1.0428, lr_0 = 6.7999e-04\n",
      "Loss = 6.2082e-01, PNorm = 97.5899, GNorm = 0.7921, lr_0 = 6.7294e-04\n",
      "Validation prc-auc = 0.673715\n",
      " 20%|██        | 10/49 [02:05<08:10, 12.56s/it]Epoch 10\n",
      "Loss = 5.7459e-01, PNorm = 97.6175, GNorm = 1.3166, lr_0 = 6.6596e-04\n",
      "Loss = 5.6504e-01, PNorm = 97.6417, GNorm = 0.7604, lr_0 = 6.5906e-04\n",
      "Loss = 5.5505e-01, PNorm = 97.6662, GNorm = 0.7163, lr_0 = 6.5222e-04\n",
      "Loss = 5.8819e-01, PNorm = 97.6906, GNorm = 1.0963, lr_0 = 6.4546e-04\n",
      "Loss = 5.9150e-01, PNorm = 97.7150, GNorm = 0.7214, lr_0 = 6.3877e-04\n",
      "Validation prc-auc = 0.688644\n",
      " 22%|██▏       | 11/49 [02:17<07:56, 12.54s/it]Epoch 11\n",
      "Loss = 5.8862e-01, PNorm = 97.7485, GNorm = 0.7999, lr_0 = 6.3148e-04\n",
      "Loss = 5.8824e-01, PNorm = 97.7823, GNorm = 0.8205, lr_0 = 6.2494e-04\n",
      "Loss = 5.3623e-01, PNorm = 97.8175, GNorm = 0.8394, lr_0 = 6.1846e-04\n",
      "Loss = 5.8235e-01, PNorm = 97.8538, GNorm = 0.7945, lr_0 = 6.1204e-04\n",
      "Loss = 5.7764e-01, PNorm = 97.8898, GNorm = 0.8961, lr_0 = 6.0570e-04\n",
      "Validation prc-auc = 0.679210\n",
      " 24%|██▍       | 12/49 [02:30<07:42, 12.51s/it]Epoch 12\n",
      "Loss = 5.7526e-01, PNorm = 97.9272, GNorm = 0.8109, lr_0 = 5.9941e-04\n",
      "Loss = 5.9038e-01, PNorm = 97.9731, GNorm = 1.1532, lr_0 = 5.9320e-04\n",
      "Loss = 5.5518e-01, PNorm = 98.0209, GNorm = 0.8471, lr_0 = 5.8705e-04\n",
      "Loss = 5.5728e-01, PNorm = 98.0601, GNorm = 0.8460, lr_0 = 5.8096e-04\n",
      "Loss = 5.5681e-01, PNorm = 98.0981, GNorm = 0.8468, lr_0 = 5.7494e-04\n",
      "Validation prc-auc = 0.688309\n",
      " 27%|██▋       | 13/49 [02:42<07:29, 12.49s/it]Epoch 13\n",
      "Loss = 5.6598e-01, PNorm = 98.1387, GNorm = 0.8266, lr_0 = 5.6897e-04\n",
      "Loss = 5.3870e-01, PNorm = 98.1848, GNorm = 0.9767, lr_0 = 5.6307e-04\n",
      "Loss = 5.4043e-01, PNorm = 98.2379, GNorm = 1.1197, lr_0 = 5.5724e-04\n",
      "Loss = 5.4619e-01, PNorm = 98.2980, GNorm = 0.8256, lr_0 = 5.5146e-04\n",
      "Validation prc-auc = 0.699077\n",
      " 29%|██▊       | 14/49 [02:55<07:17, 12.49s/it]Epoch 14\n",
      "Loss = 5.3569e-01, PNorm = 98.3714, GNorm = 0.8903, lr_0 = 5.4517e-04\n",
      "Loss = 5.6463e-01, PNorm = 98.4409, GNorm = 1.2626, lr_0 = 5.3952e-04\n",
      "Loss = 5.4523e-01, PNorm = 98.5052, GNorm = 1.1145, lr_0 = 5.3392e-04\n",
      "Loss = 5.6643e-01, PNorm = 98.5639, GNorm = 0.9076, lr_0 = 5.2839e-04\n",
      "Loss = 5.5523e-01, PNorm = 98.6153, GNorm = 0.7693, lr_0 = 5.2291e-04\n",
      "Validation prc-auc = 0.691737\n",
      " 31%|███       | 15/49 [03:07<07:03, 12.46s/it]Epoch 15\n",
      "Loss = 5.3118e-01, PNorm = 98.6636, GNorm = 0.9687, lr_0 = 5.1748e-04\n",
      "Loss = 5.3933e-01, PNorm = 98.7119, GNorm = 0.8625, lr_0 = 5.1212e-04\n",
      "Loss = 5.4049e-01, PNorm = 98.7619, GNorm = 0.8584, lr_0 = 5.0681e-04\n",
      "Loss = 5.4891e-01, PNorm = 98.8204, GNorm = 0.8701, lr_0 = 5.0155e-04\n",
      "Loss = 6.0999e-01, PNorm = 98.8840, GNorm = 1.5771, lr_0 = 4.9635e-04\n",
      "Validation prc-auc = 0.698665\n",
      " 33%|███▎      | 16/49 [03:20<06:54, 12.56s/it]Epoch 16\n",
      "Loss = 5.5149e-01, PNorm = 98.9355, GNorm = 0.8400, lr_0 = 4.9121e-04\n",
      "Loss = 5.6923e-01, PNorm = 98.9801, GNorm = 0.8205, lr_0 = 4.8611e-04\n",
      "Loss = 5.0741e-01, PNorm = 99.0231, GNorm = 0.9529, lr_0 = 4.8107e-04\n",
      "Loss = 5.1714e-01, PNorm = 99.0660, GNorm = 1.3596, lr_0 = 4.7608e-04\n",
      "Loss = 5.4610e-01, PNorm = 99.1139, GNorm = 1.2540, lr_0 = 4.7115e-04\n",
      "Loss = 5.4559e-01, PNorm = 99.1190, GNorm = 1.1154, lr_0 = 4.7065e-04\n",
      "Validation prc-auc = 0.703012\n",
      " 35%|███▍      | 17/49 [03:32<06:41, 12.56s/it]Epoch 17\n",
      "Loss = 5.6096e-01, PNorm = 99.1730, GNorm = 0.8506, lr_0 = 4.6577e-04\n",
      "Loss = 4.6652e-01, PNorm = 99.2311, GNorm = 1.2833, lr_0 = 4.6094e-04\n",
      "Loss = 5.7133e-01, PNorm = 99.2952, GNorm = 1.4062, lr_0 = 4.5616e-04\n",
      "Loss = 5.1146e-01, PNorm = 99.3744, GNorm = 0.9661, lr_0 = 4.5143e-04\n",
      "Validation prc-auc = 0.702302\n",
      " 37%|███▋      | 18/49 [03:45<06:27, 12.49s/it]Epoch 18\n",
      "Loss = 4.5711e-01, PNorm = 99.4486, GNorm = 0.8978, lr_0 = 4.4675e-04\n",
      "Loss = 5.1450e-01, PNorm = 99.5158, GNorm = 1.0773, lr_0 = 4.4212e-04\n",
      "Loss = 5.4205e-01, PNorm = 99.5852, GNorm = 0.9560, lr_0 = 4.3754e-04\n",
      "Loss = 5.7246e-01, PNorm = 99.6483, GNorm = 1.1926, lr_0 = 4.3300e-04\n",
      "Loss = 4.6836e-01, PNorm = 99.7024, GNorm = 0.8893, lr_0 = 4.2851e-04\n",
      "Validation prc-auc = 0.715082\n",
      " 39%|███▉      | 19/49 [03:57<06:14, 12.49s/it]Epoch 19\n",
      "Loss = 4.8704e-01, PNorm = 99.7477, GNorm = 0.8783, lr_0 = 4.2407e-04\n",
      "Loss = 4.9577e-01, PNorm = 99.7995, GNorm = 1.4950, lr_0 = 4.1967e-04\n",
      "Loss = 5.3146e-01, PNorm = 99.8667, GNorm = 1.1820, lr_0 = 4.1532e-04\n",
      "Loss = 5.1071e-01, PNorm = 99.9379, GNorm = 1.1795, lr_0 = 4.1101e-04\n",
      "Loss = 5.0250e-01, PNorm = 100.0001, GNorm = 1.0708, lr_0 = 4.0675e-04\n",
      "Validation prc-auc = 0.713267\n",
      " 41%|████      | 20/49 [04:09<06:01, 12.46s/it]Epoch 20\n",
      "Loss = 5.1530e-01, PNorm = 100.0550, GNorm = 2.5589, lr_0 = 4.0253e-04\n",
      "Loss = 4.7558e-01, PNorm = 100.1062, GNorm = 0.8899, lr_0 = 3.9836e-04\n",
      "Loss = 5.1477e-01, PNorm = 100.1580, GNorm = 1.3610, lr_0 = 3.9423e-04\n",
      "Loss = 4.8478e-01, PNorm = 100.2147, GNorm = 0.9908, lr_0 = 3.9014e-04\n",
      "Loss = 5.1785e-01, PNorm = 100.2678, GNorm = 1.3075, lr_0 = 3.8609e-04\n",
      "Validation prc-auc = 0.697765\n",
      " 43%|████▎     | 21/49 [04:22<05:49, 12.48s/it]Epoch 21\n",
      "Loss = 4.8804e-01, PNorm = 100.3286, GNorm = 1.9389, lr_0 = 3.8169e-04\n",
      "Loss = 4.4829e-01, PNorm = 100.3923, GNorm = 0.9990, lr_0 = 3.7773e-04\n",
      "Loss = 5.3973e-01, PNorm = 100.4597, GNorm = 1.1261, lr_0 = 3.7382e-04\n",
      "Loss = 4.5359e-01, PNorm = 100.5230, GNorm = 1.4720, lr_0 = 3.6994e-04\n",
      "Validation prc-auc = 0.730478\n",
      " 45%|████▍     | 22/49 [04:35<05:38, 12.55s/it]Epoch 22\n",
      "Loss = 5.0334e-01, PNorm = 100.5881, GNorm = 1.4204, lr_0 = 3.6610e-04\n",
      "Loss = 5.2330e-01, PNorm = 100.6420, GNorm = 1.1426, lr_0 = 3.6231e-04\n",
      "Loss = 4.4600e-01, PNorm = 100.6945, GNorm = 1.3572, lr_0 = 3.5855e-04\n",
      "Loss = 4.6355e-01, PNorm = 100.7440, GNorm = 1.0567, lr_0 = 3.5483e-04\n",
      "Loss = 5.2424e-01, PNorm = 100.7986, GNorm = 1.2341, lr_0 = 3.5115e-04\n",
      "Validation prc-auc = 0.710172\n",
      " 47%|████▋     | 23/49 [04:47<05:25, 12.51s/it]Epoch 23\n",
      "Loss = 4.8506e-01, PNorm = 100.8470, GNorm = 1.5420, lr_0 = 3.4751e-04\n",
      "Loss = 4.8682e-01, PNorm = 100.8904, GNorm = 0.9928, lr_0 = 3.4391e-04\n",
      "Loss = 4.5869e-01, PNorm = 100.9296, GNorm = 2.0953, lr_0 = 3.4034e-04\n",
      "Loss = 5.0980e-01, PNorm = 100.9674, GNorm = 1.1891, lr_0 = 3.3681e-04\n",
      "Loss = 4.5286e-01, PNorm = 101.0165, GNorm = 0.9336, lr_0 = 3.3332e-04\n",
      "Validation prc-auc = 0.728259\n",
      " 49%|████▉     | 24/49 [05:00<05:11, 12.48s/it]Epoch 24\n",
      "Loss = 4.8516e-01, PNorm = 101.0666, GNorm = 1.8970, lr_0 = 3.2952e-04\n",
      "Loss = 4.8621e-01, PNorm = 101.1131, GNorm = 1.4264, lr_0 = 3.2610e-04\n",
      "Loss = 4.3167e-01, PNorm = 101.1564, GNorm = 1.1878, lr_0 = 3.2272e-04\n",
      "Loss = 4.2437e-01, PNorm = 101.2023, GNorm = 2.7617, lr_0 = 3.1937e-04\n",
      "Loss = 4.8904e-01, PNorm = 101.2491, GNorm = 1.7485, lr_0 = 3.1606e-04\n",
      "Validation prc-auc = 0.733935\n",
      " 51%|█████     | 25/49 [05:12<04:59, 12.50s/it]Epoch 25\n",
      "Loss = 5.2475e-01, PNorm = 101.2964, GNorm = 2.3993, lr_0 = 3.1279e-04\n",
      "Loss = 4.6621e-01, PNorm = 101.3451, GNorm = 1.2041, lr_0 = 3.0954e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.3867, GNorm = 1.1062, lr_0 = 3.0633e-04\n",
      "Loss = 4.7162e-01, PNorm = 101.4270, GNorm = 1.3346, lr_0 = 3.0316e-04\n",
      "Loss = 4.3106e-01, PNorm = 101.4674, GNorm = 1.6084, lr_0 = 3.0001e-04\n",
      "Validation prc-auc = 0.729222\n",
      " 53%|█████▎    | 26/49 [05:24<04:46, 12.45s/it]Epoch 26\n",
      "Loss = 4.3461e-01, PNorm = 101.5064, GNorm = 1.1614, lr_0 = 2.9690e-04\n",
      "Loss = 4.8308e-01, PNorm = 101.5477, GNorm = 2.9387, lr_0 = 2.9382e-04\n",
      "Loss = 4.4844e-01, PNorm = 101.5879, GNorm = 1.3525, lr_0 = 2.9078e-04\n",
      "Loss = 4.5905e-01, PNorm = 101.6276, GNorm = 1.7554, lr_0 = 2.8776e-04\n",
      "Validation prc-auc = 0.723556\n",
      " 55%|█████▌    | 27/49 [05:37<04:34, 12.49s/it]Epoch 27\n",
      "Loss = 3.8075e-01, PNorm = 101.6739, GNorm = 1.2324, lr_0 = 2.8448e-04\n",
      "Loss = 4.4958e-01, PNorm = 101.7146, GNorm = 1.6542, lr_0 = 2.8153e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.7589, GNorm = 1.4257, lr_0 = 2.7861e-04\n",
      "Loss = 4.2466e-01, PNorm = 101.8007, GNorm = 1.7038, lr_0 = 2.7572e-04\n",
      "Loss = 4.7970e-01, PNorm = 101.8378, GNorm = 1.3090, lr_0 = 2.7286e-04\n",
      "Validation prc-auc = 0.707338\n",
      " 57%|█████▋    | 28/49 [05:49<04:22, 12.48s/it]Epoch 28\n",
      "Loss = 4.5278e-01, PNorm = 101.8740, GNorm = 1.3734, lr_0 = 2.7003e-04\n",
      "Loss = 4.5094e-01, PNorm = 101.9079, GNorm = 1.0547, lr_0 = 2.6723e-04\n",
      "Loss = 4.1357e-01, PNorm = 101.9411, GNorm = 1.5816, lr_0 = 2.6446e-04\n",
      "Loss = 4.6498e-01, PNorm = 101.9734, GNorm = 1.8609, lr_0 = 2.6172e-04\n",
      "Loss = 4.2933e-01, PNorm = 102.0062, GNorm = 1.0863, lr_0 = 2.5901e-04\n",
      "Validation prc-auc = 0.699879\n",
      " 59%|█████▉    | 29/49 [06:02<04:08, 12.44s/it]Epoch 29\n",
      "Loss = 3.9687e-01, PNorm = 102.0364, GNorm = 1.0911, lr_0 = 2.5632e-04\n",
      "Loss = 3.9953e-01, PNorm = 102.0640, GNorm = 1.2628, lr_0 = 2.5366e-04\n",
      "Loss = 4.5717e-01, PNorm = 102.0935, GNorm = 1.8129, lr_0 = 2.5103e-04\n",
      "Loss = 4.1537e-01, PNorm = 102.1263, GNorm = 1.2622, lr_0 = 2.4843e-04\n",
      "Loss = 4.6298e-01, PNorm = 102.1587, GNorm = 1.6679, lr_0 = 2.4585e-04\n",
      "Validation prc-auc = 0.729581\n",
      " 61%|██████    | 30/49 [06:14<03:56, 12.43s/it]Epoch 30\n",
      "Loss = 4.4116e-01, PNorm = 102.1918, GNorm = 2.3824, lr_0 = 2.4330e-04\n",
      "Loss = 4.4225e-01, PNorm = 102.2200, GNorm = 2.0057, lr_0 = 2.4078e-04\n",
      "Loss = 4.1512e-01, PNorm = 102.2495, GNorm = 1.2579, lr_0 = 2.3828e-04\n",
      "Loss = 4.3965e-01, PNorm = 102.2783, GNorm = 1.9444, lr_0 = 2.3581e-04\n",
      "Validation prc-auc = 0.721862\n",
      " 63%|██████▎   | 31/49 [06:27<03:43, 12.43s/it]Epoch 31\n",
      "Loss = 4.1521e-01, PNorm = 102.3138, GNorm = 2.0351, lr_0 = 2.3312e-04\n",
      "Loss = 4.6530e-01, PNorm = 102.3409, GNorm = 0.9553, lr_0 = 2.3071e-04\n",
      "Loss = 4.4350e-01, PNorm = 102.3687, GNorm = 1.5819, lr_0 = 2.2831e-04\n",
      "Loss = 4.1122e-01, PNorm = 102.3959, GNorm = 1.5397, lr_0 = 2.2595e-04\n",
      "Loss = 3.9777e-01, PNorm = 102.4228, GNorm = 0.9937, lr_0 = 2.2360e-04\n",
      "Validation prc-auc = 0.721970\n",
      " 65%|██████▌   | 32/49 [06:39<03:33, 12.53s/it]Epoch 32\n",
      "Loss = 4.3843e-01, PNorm = 102.4485, GNorm = 3.1887, lr_0 = 2.2129e-04\n",
      "Loss = 3.8235e-01, PNorm = 102.4765, GNorm = 1.1239, lr_0 = 2.1899e-04\n",
      "Loss = 4.2292e-01, PNorm = 102.5009, GNorm = 1.9876, lr_0 = 2.1672e-04\n",
      "Loss = 4.3276e-01, PNorm = 102.5277, GNorm = 1.5407, lr_0 = 2.1447e-04\n",
      "Loss = 4.6404e-01, PNorm = 102.5524, GNorm = 1.9581, lr_0 = 2.1225e-04\n",
      "Validation prc-auc = 0.704753\n",
      " 67%|██████▋   | 33/49 [06:52<03:19, 12.50s/it]Epoch 33\n",
      "Loss = 4.0377e-01, PNorm = 102.5779, GNorm = 1.4487, lr_0 = 2.1005e-04\n",
      "Loss = 4.3812e-01, PNorm = 102.6001, GNorm = 1.7061, lr_0 = 2.0787e-04\n",
      "Loss = 4.1834e-01, PNorm = 102.6218, GNorm = 1.3299, lr_0 = 2.0571e-04\n",
      "Loss = 4.0906e-01, PNorm = 102.6444, GNorm = 1.2884, lr_0 = 2.0358e-04\n",
      "Loss = 4.0979e-01, PNorm = 102.6662, GNorm = 1.7456, lr_0 = 2.0147e-04\n",
      "Validation prc-auc = 0.741242\n",
      " 69%|██████▉   | 34/49 [07:04<03:07, 12.52s/it]Epoch 34\n",
      "Loss = 4.2813e-01, PNorm = 102.6889, GNorm = 2.0504, lr_0 = 1.9917e-04\n",
      "Loss = 4.2911e-01, PNorm = 102.7107, GNorm = 2.0385, lr_0 = 1.9711e-04\n",
      "Loss = 4.0048e-01, PNorm = 102.7322, GNorm = 1.4560, lr_0 = 1.9506e-04\n",
      "Loss = 3.9704e-01, PNorm = 102.7581, GNorm = 1.1820, lr_0 = 1.9304e-04\n",
      "Validation prc-auc = 0.727587\n",
      " 71%|███████▏  | 35/49 [07:17<02:54, 12.49s/it]Epoch 35\n",
      "Loss = 3.3330e-01, PNorm = 102.7780, GNorm = 1.1825, lr_0 = 1.9104e-04\n",
      "Loss = 3.8412e-01, PNorm = 102.7992, GNorm = 1.7658, lr_0 = 1.8906e-04\n",
      "Loss = 3.7517e-01, PNorm = 102.8210, GNorm = 1.2284, lr_0 = 1.8710e-04\n",
      "Loss = 4.5571e-01, PNorm = 102.8433, GNorm = 2.2784, lr_0 = 1.8516e-04\n",
      "Loss = 3.8375e-01, PNorm = 102.8635, GNorm = 1.3376, lr_0 = 1.8324e-04\n",
      "Validation prc-auc = 0.724475\n",
      " 73%|███████▎  | 36/49 [07:29<02:42, 12.48s/it]Epoch 36\n",
      "Loss = 4.4192e-01, PNorm = 102.8839, GNorm = 1.9883, lr_0 = 1.8134e-04\n",
      "Loss = 3.9549e-01, PNorm = 102.9023, GNorm = 1.8302, lr_0 = 1.7946e-04\n",
      "Loss = 3.7269e-01, PNorm = 102.9189, GNorm = 1.2762, lr_0 = 1.7760e-04\n",
      "Loss = 4.3072e-01, PNorm = 102.9375, GNorm = 1.6168, lr_0 = 1.7575e-04\n",
      "Loss = 4.1462e-01, PNorm = 102.9576, GNorm = 1.4891, lr_0 = 1.7393e-04\n",
      "Validation prc-auc = 0.729879\n",
      " 76%|███████▌  | 37/49 [07:42<02:29, 12.48s/it]Epoch 37\n",
      "Loss = 3.9510e-01, PNorm = 102.9784, GNorm = 1.6406, lr_0 = 1.7195e-04\n",
      "Loss = 3.8523e-01, PNorm = 102.9971, GNorm = 3.6376, lr_0 = 1.7017e-04\n",
      "Loss = 4.0788e-01, PNorm = 103.0164, GNorm = 1.6742, lr_0 = 1.6840e-04\n",
      "Loss = 3.9008e-01, PNorm = 103.0370, GNorm = 1.3618, lr_0 = 1.6666e-04\n",
      "Loss = 3.6996e-01, PNorm = 103.0561, GNorm = 2.1714, lr_0 = 1.6493e-04\n",
      "Validation prc-auc = 0.732890\n",
      " 78%|███████▊  | 38/49 [07:55<02:18, 12.58s/it]Epoch 38\n",
      "Loss = 4.2739e-01, PNorm = 103.0759, GNorm = 2.0150, lr_0 = 1.6322e-04\n",
      "Loss = 3.7266e-01, PNorm = 103.0961, GNorm = 1.5987, lr_0 = 1.6152e-04\n",
      "Loss = 4.0328e-01, PNorm = 103.1141, GNorm = 1.2749, lr_0 = 1.5985e-04\n",
      "Loss = 4.0170e-01, PNorm = 103.1329, GNorm = 1.6032, lr_0 = 1.5819e-04\n",
      "Loss = 3.5034e-01, PNorm = 103.1500, GNorm = 1.2491, lr_0 = 1.5655e-04\n",
      "Validation prc-auc = 0.730448\n",
      " 80%|███████▉  | 39/49 [08:07<02:05, 12.55s/it]Epoch 39\n",
      "Loss = 4.0423e-01, PNorm = 103.1649, GNorm = 3.4590, lr_0 = 1.5493e-04\n",
      "Loss = 4.0749e-01, PNorm = 103.1823, GNorm = 2.6038, lr_0 = 1.5332e-04\n",
      "Loss = 3.7462e-01, PNorm = 103.1983, GNorm = 1.7902, lr_0 = 1.5173e-04\n",
      "Loss = 3.6832e-01, PNorm = 103.2140, GNorm = 2.0638, lr_0 = 1.5016e-04\n",
      "Validation prc-auc = 0.726064\n",
      " 82%|████████▏ | 40/49 [08:20<01:52, 12.55s/it]Epoch 40\n",
      "Loss = 3.8487e-01, PNorm = 103.2275, GNorm = 1.6070, lr_0 = 1.4860e-04\n",
      "Loss = 3.5290e-01, PNorm = 103.2421, GNorm = 2.4138, lr_0 = 1.4706e-04\n",
      "Loss = 4.0514e-01, PNorm = 103.2566, GNorm = 1.1793, lr_0 = 1.4554e-04\n",
      "Loss = 3.6971e-01, PNorm = 103.2715, GNorm = 1.2253, lr_0 = 1.4403e-04\n",
      "Loss = 4.0549e-01, PNorm = 103.2859, GNorm = 1.1838, lr_0 = 1.4253e-04\n",
      "Validation prc-auc = 0.728744\n",
      " 84%|████████▎ | 41/49 [08:32<01:40, 12.62s/it]Epoch 41\n",
      "Loss = 4.0692e-01, PNorm = 103.3017, GNorm = 2.3294, lr_0 = 1.4091e-04\n",
      "Loss = 3.6107e-01, PNorm = 103.3157, GNorm = 1.8161, lr_0 = 1.3945e-04\n",
      "Loss = 4.3158e-01, PNorm = 103.3296, GNorm = 2.0411, lr_0 = 1.3800e-04\n",
      "Loss = 3.8727e-01, PNorm = 103.3434, GNorm = 2.1048, lr_0 = 1.3657e-04\n",
      "Loss = 3.5917e-01, PNorm = 103.3583, GNorm = 0.9664, lr_0 = 1.3515e-04\n",
      "Validation prc-auc = 0.727437\n",
      " 86%|████████▌ | 42/49 [08:45<01:28, 12.66s/it]Epoch 42\n",
      "Loss = 4.1430e-01, PNorm = 103.3714, GNorm = 2.0484, lr_0 = 1.3375e-04\n",
      "Loss = 3.7543e-01, PNorm = 103.3872, GNorm = 2.0368, lr_0 = 1.3237e-04\n",
      "Loss = 4.2834e-01, PNorm = 103.4001, GNorm = 1.5786, lr_0 = 1.3099e-04\n",
      "Loss = 3.5447e-01, PNorm = 103.4133, GNorm = 1.7577, lr_0 = 1.2963e-04\n",
      "Loss = 3.9995e-01, PNorm = 103.4242, GNorm = 1.9164, lr_0 = 1.2829e-04\n",
      "Validation prc-auc = 0.734144\n",
      " 88%|████████▊ | 43/49 [08:58<01:15, 12.59s/it]Epoch 43\n",
      "Loss = 3.3649e-01, PNorm = 103.4355, GNorm = 1.3637, lr_0 = 1.2696e-04\n",
      "Loss = 3.6927e-01, PNorm = 103.4467, GNorm = 2.3235, lr_0 = 1.2564e-04\n",
      "Loss = 3.8944e-01, PNorm = 103.4571, GNorm = 1.8026, lr_0 = 1.2434e-04\n",
      "Loss = 3.8420e-01, PNorm = 103.4687, GNorm = 1.6287, lr_0 = 1.2305e-04\n",
      "Validation prc-auc = 0.731557\n",
      " 90%|████████▉ | 44/49 [09:10<01:02, 12.54s/it]Epoch 44\n",
      "Loss = 3.5538e-01, PNorm = 103.4799, GNorm = 2.2236, lr_0 = 1.2165e-04\n",
      "Loss = 3.3368e-01, PNorm = 103.4906, GNorm = 2.1795, lr_0 = 1.2039e-04\n",
      "Loss = 3.9180e-01, PNorm = 103.4997, GNorm = 2.1030, lr_0 = 1.1914e-04\n",
      "Loss = 3.5748e-01, PNorm = 103.5107, GNorm = 1.3978, lr_0 = 1.1790e-04\n",
      "Loss = 3.7379e-01, PNorm = 103.5203, GNorm = 1.9116, lr_0 = 1.1668e-04\n",
      "Validation prc-auc = 0.722937\n",
      " 92%|█████████▏| 45/49 [09:22<00:50, 12.52s/it]Epoch 45\n",
      "Loss = 3.6534e-01, PNorm = 103.5314, GNorm = 2.0698, lr_0 = 1.1547e-04\n",
      "Loss = 3.5860e-01, PNorm = 103.5417, GNorm = 2.5266, lr_0 = 1.1427e-04\n",
      "Loss = 3.4249e-01, PNorm = 103.5502, GNorm = 2.0074, lr_0 = 1.1309e-04\n",
      "Loss = 3.8670e-01, PNorm = 103.5614, GNorm = 2.2272, lr_0 = 1.1192e-04\n",
      "Loss = 4.4395e-01, PNorm = 103.5698, GNorm = 3.2936, lr_0 = 1.1076e-04\n",
      "Validation prc-auc = 0.731044\n",
      " 94%|█████████▍| 46/49 [09:35<00:37, 12.55s/it]Epoch 46\n",
      "Loss = 3.5897e-01, PNorm = 103.5800, GNorm = 1.6338, lr_0 = 1.0961e-04\n",
      "Loss = 3.2715e-01, PNorm = 103.5895, GNorm = 1.2976, lr_0 = 1.0847e-04\n",
      "Loss = 3.4290e-01, PNorm = 103.5986, GNorm = 1.9580, lr_0 = 1.0735e-04\n",
      "Loss = 3.4036e-01, PNorm = 103.6072, GNorm = 1.4277, lr_0 = 1.0623e-04\n",
      "Loss = 4.3518e-01, PNorm = 103.6140, GNorm = 2.1300, lr_0 = 1.0513e-04\n",
      "Validation prc-auc = 0.731099\n",
      " 96%|█████████▌| 47/49 [09:48<00:25, 12.52s/it]Epoch 47\n",
      "Loss = 3.6067e-01, PNorm = 103.6237, GNorm = 1.7237, lr_0 = 1.0393e-04\n",
      "Loss = 3.7243e-01, PNorm = 103.6312, GNorm = 1.5077, lr_0 = 1.0285e-04\n",
      "Loss = 3.9727e-01, PNorm = 103.6384, GNorm = 1.3241, lr_0 = 1.0179e-04\n",
      "Loss = 3.4225e-01, PNorm = 103.6475, GNorm = 0.9065, lr_0 = 1.0073e-04\n",
      "Validation prc-auc = 0.733490\n",
      " 98%|█████████▊| 48/49 [10:00<00:12, 12.55s/it]Epoch 48\n",
      "Loss = 3.6779e-01, PNorm = 103.6554, GNorm = 2.3459, lr_0 = 1.0000e-04\n",
      "Loss = 3.6082e-01, PNorm = 103.6636, GNorm = 1.3462, lr_0 = 1.0000e-04\n",
      "Loss = 3.7138e-01, PNorm = 103.6726, GNorm = 1.9617, lr_0 = 1.0000e-04\n",
      "Loss = 3.5044e-01, PNorm = 103.6815, GNorm = 1.5092, lr_0 = 1.0000e-04\n",
      "Loss = 3.6957e-01, PNorm = 103.6885, GNorm = 2.6978, lr_0 = 1.0000e-04\n",
      "Validation prc-auc = 0.733983\n",
      "100%|██████████| 49/49 [10:13<00:00, 12.51s/it]\n",
      "Model 0 best validation prc-auc = 0.741242 on epoch 33\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"ffn.1.weight\".\n",
      "Loading pretrained parameter \"ffn.1.bias\".\n",
      "Loading pretrained parameter \"ffn.4.weight\".\n",
      "Loading pretrained parameter \"ffn.4.bias\".\n",
      "Loading pretrained parameter \"ffn.7.weight\".\n",
      "Loading pretrained parameter \"ffn.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test prc-auc = 0.741242                \n",
      "Ensemble test prc-auc = 0.741242\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test prc-auc = 0.741242\n",
      "Overall test prc-auc = 0.741242 +/- 0.000000\n",
      "Elapsed time = 0:10:16\n",
      "Command line\n",
      "python /home/steshin/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/ipykernel_launcher.py --ip=127.0.0.1 --stdin=9013 --control=9011 --hb=9010 --Session.signature_scheme=\"hmac-sha256\" --Session.key=b\"6c604d94-190d-4da2-9c36-788708df5377\" --shell=9012 --transport=\"tcp\" --iopub=9014 --f=/home/steshin/.local/share/jupyter/runtime/kernel-v2-2822374BRuswu5zWdXq.json\n",
      "Args\n",
      "{'activation': 'ReLU',\n",
      " 'adding_h': False,\n",
      " 'aggregation': 'mean',\n",
      " 'aggregation_norm': 100,\n",
      " 'atom_descriptor_scaling': True,\n",
      " 'atom_descriptors': None,\n",
      " 'atom_descriptors_path': None,\n",
      " 'atom_descriptors_size': 0,\n",
      " 'atom_features_size': 0,\n",
      " 'atom_messages': False,\n",
      " 'batch_size': 50,\n",
      " 'bias': False,\n",
      " 'bias_solvent': False,\n",
      " 'bond_feature_scaling': True,\n",
      " 'bond_features_path': None,\n",
      " 'bond_features_size': 0,\n",
      " 'cache_cutoff': 10000,\n",
      " 'checkpoint_dir': None,\n",
      " 'checkpoint_frzn': None,\n",
      " 'checkpoint_path': None,\n",
      " 'checkpoint_paths': None,\n",
      " 'class_balance': False,\n",
      " 'config_path': None,\n",
      " 'crossval_index_dir': None,\n",
      " 'crossval_index_file': None,\n",
      " 'crossval_index_sets': None,\n",
      " 'cuda': True,\n",
      " 'data_path': '/tmp/chemprop/train_1.csv',\n",
      " 'data_weights_path': None,\n",
      " 'dataset_type': 'classification',\n",
      " 'depth': 5,\n",
      " 'depth_solvent': 3,\n",
      " 'device': device(type='cuda', index=1),\n",
      " 'dropout': 0.7,\n",
      " 'empty_cache': False,\n",
      " 'ensemble_size': 1,\n",
      " 'epochs': 49,\n",
      " 'evidential_regularization': 0,\n",
      " 'explicit_h': False,\n",
      " 'extra_metrics': [],\n",
      " 'features_generator': None,\n",
      " 'features_only': False,\n",
      " 'features_path': None,\n",
      " 'features_scaling': True,\n",
      " 'features_size': None,\n",
      " 'ffn_hidden_size': 600,\n",
      " 'ffn_num_layers': 3,\n",
      " 'final_lr': 0.0001,\n",
      " 'folds_file': None,\n",
      " 'freeze_first_only': False,\n",
      " 'frzn_ffn_layers': 0,\n",
      " 'gpu': 1,\n",
      " 'grad_clip': None,\n",
      " 'hidden_size': 3600,\n",
      " 'hidden_size_solvent': 300,\n",
      " 'ignore_columns': None,\n",
      " 'init_lr': 0.0001,\n",
      " 'log_frequency': 10,\n",
      " 'loss_function': 'binary_cross_entropy',\n",
      " 'max_data_size': None,\n",
      " 'max_lr': 0.001,\n",
      " 'metric': 'prc-auc',\n",
      " 'metrics': ['prc-auc'],\n",
      " 'minimize_score': False,\n",
      " 'mpn_shared': False,\n",
      " 'multiclass_num_classes': 3,\n",
      " 'no_atom_descriptor_scaling': False,\n",
      " 'no_bond_features_scaling': False,\n",
      " 'no_cache_mol': False,\n",
      " 'no_cuda': False,\n",
      " 'no_features_scaling': False,\n",
      " 'num_folds': 1,\n",
      " 'num_lrs': 1,\n",
      " 'num_tasks': 1,\n",
      " 'num_workers': 8,\n",
      " 'number_of_molecules': 1,\n",
      " 'overwrite_default_atom_features': False,\n",
      " 'overwrite_default_bond_features': False,\n",
      " 'phase_features_path': None,\n",
      " 'pytorch_seed': 0,\n",
      " 'quiet': False,\n",
      " 'reaction': False,\n",
      " 'reaction_mode': 'reac_diff',\n",
      " 'reaction_solvent': False,\n",
      " 'resume_experiment': False,\n",
      " 'save_dir': '/tmp/chemprop/checkpoint',\n",
      " 'save_preds': True,\n",
      " 'save_smiles_splits': False,\n",
      " 'seed': 0,\n",
      " 'separate_test_atom_descriptors_path': None,\n",
      " 'separate_test_bond_features_path': None,\n",
      " 'separate_test_features_path': None,\n",
      " 'separate_test_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_test_phase_features_path': None,\n",
      " 'separate_val_atom_descriptors_path': None,\n",
      " 'separate_val_bond_features_path': None,\n",
      " 'separate_val_features_path': None,\n",
      " 'separate_val_path': '/tmp/chemprop/test_1.csv',\n",
      " 'separate_val_phase_features_path': None,\n",
      " 'show_individual_scores': False,\n",
      " 'smiles_columns': ['smiles'],\n",
      " 'spectra_activation': 'exp',\n",
      " 'spectra_phase_mask_path': None,\n",
      " 'spectra_target_floor': 1e-08,\n",
      " 'split_key_molecule': 0,\n",
      " 'split_sizes': [1.0, 0.0, 0.0],\n",
      " 'split_type': 'random',\n",
      " 'target_columns': None,\n",
      " 'target_weights': None,\n",
      " 'task_names': ['targets'],\n",
      " 'test': False,\n",
      " 'test_fold_index': None,\n",
      " 'train_data_size': None,\n",
      " 'undirected': False,\n",
      " 'use_input_features': False,\n",
      " 'val_fold_index': None,\n",
      " 'warmup_epochs': 2.0}\n",
      "Setting molecule featurization parameters to default.\n",
      "Loading data\n",
      "2385it [00:00, 401324.52it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 333547.23it/s]\n",
      "100%|██████████| 2385/2385 [00:00<00:00, 169357.09it/s]\n",
      "Number of tasks = 1\n",
      "Fold 0\n",
      "Splitting data with seed 0\n",
      "1190it [00:00, 436257.47it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 333637.82it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 191102.76it/s]\n",
      "1190it [00:00, 459935.66it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 337655.38it/s]\n",
      "100%|██████████| 1190/1190 [00:00<00:00, 200370.20it/s]\n",
      "Class sizes\n",
      "targets 0: 29.39%, 1: 70.61%\n",
      "Total size = 2,385 | train size = 2,385 | val size = 1,190 | test size = 1,190\n",
      "Building model 0\n",
      "MoleculeModel(\n",
      "  (sigmoid): Sigmoid()\n",
      "  (encoder): MPN(\n",
      "    (encoder): ModuleList(\n",
      "      (0): MPNEncoder(\n",
      "        (dropout_layer): Dropout(p=0.7, inplace=False)\n",
      "        (act_func): ReLU()\n",
      "        (W_i): Linear(in_features=147, out_features=3600, bias=False)\n",
      "        (W_h): Linear(in_features=3600, out_features=3600, bias=False)\n",
      "        (W_o): Linear(in_features=3733, out_features=3600, bias=True)\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (ffn): Sequential(\n",
      "    (0): Dropout(p=0.7, inplace=False)\n",
      "    (1): Linear(in_features=3600, out_features=600, bias=True)\n",
      "    (2): ReLU()\n",
      "    (3): Dropout(p=0.7, inplace=False)\n",
      "    (4): Linear(in_features=600, out_features=600, bias=True)\n",
      "    (5): ReLU()\n",
      "    (6): Dropout(p=0.7, inplace=False)\n",
      "    (7): Linear(in_features=600, out_features=1, bias=True)\n",
      "  )\n",
      ")\n",
      "Number of parameters = 29,457,001\n",
      "Moving model to cuda\n",
      "  0%|          | 0/49 [00:00<?, ?it/s]Epoch 0\n",
      "Loss = 1.0067e+00, PNorm = 95.8215, GNorm = 11.3097, lr_0 = 2.0532e-04\n",
      "Loss = 8.2540e-01, PNorm = 95.8920, GNorm = 4.7372, lr_0 = 3.0106e-04\n",
      "Loss = 6.7640e-01, PNorm = 95.9742, GNorm = 3.5823, lr_0 = 3.9681e-04\n",
      "Loss = 6.1312e-01, PNorm = 96.0487, GNorm = 2.5055, lr_0 = 4.9255e-04\n",
      "Validation prc-auc = 0.615862\n",
      "  2%|▏         | 1/49 [00:12<10:06, 12.63s/it]Epoch 1\n",
      "Loss = 6.1991e-01, PNorm = 96.1183, GNorm = 2.2756, lr_0 = 5.9787e-04\n",
      "Loss = 6.4763e-01, PNorm = 96.1786, GNorm = 2.1096, lr_0 = 6.9362e-04\n",
      "Loss = 6.4850e-01, PNorm = 96.2327, GNorm = 2.1754, lr_0 = 7.8936e-04\n",
      "Loss = 6.1910e-01, PNorm = 96.2873, GNorm = 1.6985, lr_0 = 8.8511e-04\n",
      "Loss = 6.2604e-01, PNorm = 96.3436, GNorm = 1.7381, lr_0 = 9.8085e-04\n",
      "Validation prc-auc = 0.629335\n",
      "  4%|▍         | 2/49 [00:25<10:06, 12.91s/it]Epoch 2\n",
      "Loss = 6.2445e-01, PNorm = 96.4006, GNorm = 1.5906, lr_0 = 9.9170e-04\n",
      "Loss = 6.0673e-01, PNorm = 96.4588, GNorm = 1.5449, lr_0 = 9.8141e-04\n",
      "Loss = 6.5753e-01, PNorm = 96.5077, GNorm = 1.1993, lr_0 = 9.7124e-04\n",
      "Loss = 6.1372e-01, PNorm = 96.5569, GNorm = 1.1501, lr_0 = 9.6116e-04\n",
      "Loss = 5.8741e-01, PNorm = 96.5987, GNorm = 1.5248, lr_0 = 9.5120e-04\n",
      "Validation prc-auc = 0.635690\n",
      "  6%|▌         | 3/49 [00:38<09:49, 12.82s/it]Epoch 3\n",
      "Loss = 6.1903e-01, PNorm = 96.6363, GNorm = 1.1153, lr_0 = 9.4133e-04\n",
      "Loss = 5.9095e-01, PNorm = 96.6750, GNorm = 1.1666, lr_0 = 9.3157e-04\n",
      "Loss = 6.3447e-01, PNorm = 96.7094, GNorm = 1.1577, lr_0 = 9.2191e-04\n",
      "Loss = 6.0546e-01, PNorm = 96.7454, GNorm = 1.1495, lr_0 = 9.1235e-04\n",
      "Loss = 6.1925e-01, PNorm = 96.7774, GNorm = 1.0267, lr_0 = 9.0289e-04\n",
      "Loss = 5.3680e-01, PNorm = 96.7807, GNorm = 1.1632, lr_0 = 9.0195e-04\n",
      "Validation prc-auc = 0.641041\n",
      "  8%|▊         | 4/49 [00:51<09:32, 12.73s/it]Epoch 4\n",
      "Loss = 6.1236e-01, PNorm = 96.8128, GNorm = 0.9591, lr_0 = 8.9260e-04\n",
      "Loss = 5.9317e-01, PNorm = 96.8448, GNorm = 1.0099, lr_0 = 8.8334e-04\n",
      "Loss = 5.9902e-01, PNorm = 96.8771, GNorm = 1.0602, lr_0 = 8.7418e-04\n",
      "Loss = 6.0361e-01, PNorm = 96.9112, GNorm = 1.0944, lr_0 = 8.6512e-04\n",
      "Validation prc-auc = 0.660186\n",
      " 10%|█         | 5/49 [01:03<09:16, 12.66s/it]Epoch 5\n",
      "Loss = 5.9755e-01, PNorm = 96.9443, GNorm = 0.9007, lr_0 = 8.5615e-04\n",
      "Loss = 6.1481e-01, PNorm = 96.9818, GNorm = 0.9244, lr_0 = 8.4727e-04\n",
      "Loss = 5.8683e-01, PNorm = 97.0160, GNorm = 1.0581, lr_0 = 8.3848e-04\n",
      "Loss = 6.0921e-01, PNorm = 97.0481, GNorm = 1.1509, lr_0 = 8.2979e-04\n",
      "Loss = 5.9022e-01, PNorm = 97.0812, GNorm = 1.1127, lr_0 = 8.2118e-04\n",
      "Validation prc-auc = 0.651851\n",
      " 12%|█▏        | 6/49 [01:16<09:03, 12.64s/it]Epoch 6\n",
      "Loss = 5.7595e-01, PNorm = 97.1133, GNorm = 0.9377, lr_0 = 8.1267e-04\n",
      "Loss = 6.1230e-01, PNorm = 97.1476, GNorm = 1.0435, lr_0 = 8.0424e-04\n",
      "Loss = 6.2784e-01, PNorm = 97.1783, GNorm = 0.8401, lr_0 = 7.9590e-04\n",
      "Loss = 5.8118e-01, PNorm = 97.2112, GNorm = 1.2101, lr_0 = 7.8765e-04\n",
      "Loss = 5.9307e-01, PNorm = 97.2455, GNorm = 0.8913, lr_0 = 7.7948e-04\n",
      "Validation prc-auc = 0.655969\n",
      " 14%|█▍        | 7/49 [01:28<08:52, 12.68s/it]Epoch 7\n",
      "Loss = 6.4780e-01, PNorm = 97.2792, GNorm = 1.0028, lr_0 = 7.7060e-04\n",
      "Loss = 6.0253e-01, PNorm = 97.3069, GNorm = 0.7932, lr_0 = 7.6261e-04\n",
      "Loss = 5.9209e-01, PNorm = 97.3315, GNorm = 1.2744, lr_0 = 7.5470e-04\n",
      "Loss = 5.9137e-01, PNorm = 97.3523, GNorm = 0.8005, lr_0 = 7.4687e-04\n",
      "Loss = 6.1059e-01, PNorm = 97.3749, GNorm = 0.8399, lr_0 = 7.3913e-04\n",
      "Validation prc-auc = 0.664513\n",
      " 16%|█▋        | 8/49 [01:41<08:39, 12.67s/it]Epoch 8\n",
      "Loss = 5.5741e-01, PNorm = 97.3986, GNorm = 0.8739, lr_0 = 7.3146e-04\n",
      "Loss = 6.2573e-01, PNorm = 97.4220, GNorm = 0.7532, lr_0 = 7.2388e-04\n",
      "Loss = 5.9088e-01, PNorm = 97.4468, GNorm = 1.2770, lr_0 = 7.1637e-04\n",
      "Loss = 5.9256e-01, PNorm = 97.4694, GNorm = 0.7629, lr_0 = 7.0894e-04\n",
      "Validation prc-auc = 0.672864\n",
      " 18%|█▊        | 9/49 [01:54<08:25, 12.65s/it]Epoch 9\n",
      "Loss = 6.5881e-01, PNorm = 97.4916, GNorm = 0.8419, lr_0 = 7.0159e-04\n",
      "Loss = 5.8727e-01, PNorm = 97.5139, GNorm = 0.7291, lr_0 = 6.9432e-04\n",
      "Loss = 5.8728e-01, PNorm = 97.5374, GNorm = 1.0385, lr_0 = 6.8712e-04\n",
      "Loss = 5.8502e-01, PNorm = 97.5633, GNorm = 1.0428, lr_0 = 6.7999e-04\n",
      "Loss = 6.2082e-01, PNorm = 97.5899, GNorm = 0.7921, lr_0 = 6.7294e-04\n",
      "Validation prc-auc = 0.673715\n",
      " 20%|██        | 10/49 [02:06<08:12, 12.63s/it]Epoch 10\n",
      "Loss = 5.7459e-01, PNorm = 97.6175, GNorm = 1.3166, lr_0 = 6.6596e-04\n",
      "Loss = 5.6504e-01, PNorm = 97.6417, GNorm = 0.7604, lr_0 = 6.5906e-04\n",
      "Loss = 5.5505e-01, PNorm = 97.6662, GNorm = 0.7163, lr_0 = 6.5222e-04\n",
      "Loss = 5.8819e-01, PNorm = 97.6906, GNorm = 1.0963, lr_0 = 6.4546e-04\n",
      "Loss = 5.9150e-01, PNorm = 97.7150, GNorm = 0.7214, lr_0 = 6.3877e-04\n",
      "Validation prc-auc = 0.688644\n",
      " 22%|██▏       | 11/49 [02:19<07:59, 12.62s/it]Epoch 11\n",
      "Loss = 5.8862e-01, PNorm = 97.7485, GNorm = 0.7999, lr_0 = 6.3148e-04\n",
      "Loss = 5.8824e-01, PNorm = 97.7823, GNorm = 0.8205, lr_0 = 6.2494e-04\n",
      "Loss = 5.3623e-01, PNorm = 97.8175, GNorm = 0.8394, lr_0 = 6.1846e-04\n",
      "Loss = 5.8235e-01, PNorm = 97.8538, GNorm = 0.7945, lr_0 = 6.1204e-04\n",
      "Loss = 5.7764e-01, PNorm = 97.8898, GNorm = 0.8961, lr_0 = 6.0570e-04\n",
      "Validation prc-auc = 0.679210\n",
      " 24%|██▍       | 12/49 [02:32<07:48, 12.67s/it]Epoch 12\n",
      "Loss = 5.7526e-01, PNorm = 97.9272, GNorm = 0.8109, lr_0 = 5.9941e-04\n",
      "Loss = 5.9038e-01, PNorm = 97.9731, GNorm = 1.1532, lr_0 = 5.9320e-04\n",
      "Loss = 5.5518e-01, PNorm = 98.0209, GNorm = 0.8471, lr_0 = 5.8705e-04\n",
      "Loss = 5.5728e-01, PNorm = 98.0601, GNorm = 0.8460, lr_0 = 5.8096e-04\n",
      "Loss = 5.5681e-01, PNorm = 98.0981, GNorm = 0.8468, lr_0 = 5.7494e-04\n",
      "Validation prc-auc = 0.688309\n",
      " 27%|██▋       | 13/49 [02:44<07:33, 12.61s/it]Epoch 13\n",
      "Loss = 5.6598e-01, PNorm = 98.1387, GNorm = 0.8266, lr_0 = 5.6897e-04\n",
      "Loss = 5.3870e-01, PNorm = 98.1848, GNorm = 0.9767, lr_0 = 5.6307e-04\n",
      "Loss = 5.4043e-01, PNorm = 98.2379, GNorm = 1.1197, lr_0 = 5.5724e-04\n",
      "Loss = 5.4619e-01, PNorm = 98.2980, GNorm = 0.8256, lr_0 = 5.5146e-04\n",
      "Validation prc-auc = 0.699077\n",
      " 29%|██▊       | 14/49 [02:57<07:21, 12.61s/it]Epoch 14\n",
      "Loss = 5.3569e-01, PNorm = 98.3714, GNorm = 0.8903, lr_0 = 5.4517e-04\n",
      "Loss = 5.6463e-01, PNorm = 98.4409, GNorm = 1.2626, lr_0 = 5.3952e-04\n",
      "Loss = 5.4523e-01, PNorm = 98.5052, GNorm = 1.1145, lr_0 = 5.3392e-04\n",
      "Loss = 5.6643e-01, PNorm = 98.5639, GNorm = 0.9076, lr_0 = 5.2839e-04\n",
      "Loss = 5.5523e-01, PNorm = 98.6153, GNorm = 0.7693, lr_0 = 5.2291e-04\n",
      "Validation prc-auc = 0.691737\n",
      " 31%|███       | 15/49 [03:09<07:07, 12.57s/it]Epoch 15\n",
      "Loss = 5.3118e-01, PNorm = 98.6636, GNorm = 0.9687, lr_0 = 5.1748e-04\n",
      "Loss = 5.3933e-01, PNorm = 98.7119, GNorm = 0.8625, lr_0 = 5.1212e-04\n",
      "Loss = 5.4049e-01, PNorm = 98.7619, GNorm = 0.8584, lr_0 = 5.0681e-04\n",
      "Loss = 5.4891e-01, PNorm = 98.8204, GNorm = 0.8701, lr_0 = 5.0155e-04\n",
      "Loss = 6.0999e-01, PNorm = 98.8840, GNorm = 1.5771, lr_0 = 4.9635e-04\n",
      "Validation prc-auc = 0.698665\n",
      " 33%|███▎      | 16/49 [03:22<06:54, 12.55s/it]Epoch 16\n",
      "Loss = 5.5149e-01, PNorm = 98.9355, GNorm = 0.8400, lr_0 = 4.9121e-04\n",
      "Loss = 5.6923e-01, PNorm = 98.9801, GNorm = 0.8205, lr_0 = 4.8611e-04\n",
      "Loss = 5.0741e-01, PNorm = 99.0231, GNorm = 0.9529, lr_0 = 4.8107e-04\n",
      "Loss = 5.1714e-01, PNorm = 99.0660, GNorm = 1.3596, lr_0 = 4.7608e-04\n",
      "Loss = 5.4610e-01, PNorm = 99.1139, GNorm = 1.2540, lr_0 = 4.7115e-04\n",
      "Loss = 5.4559e-01, PNorm = 99.1190, GNorm = 1.1154, lr_0 = 4.7065e-04\n",
      "Validation prc-auc = 0.703012\n",
      " 35%|███▍      | 17/49 [03:34<06:42, 12.59s/it]Epoch 17\n",
      "Loss = 5.6096e-01, PNorm = 99.1730, GNorm = 0.8506, lr_0 = 4.6577e-04\n",
      "Loss = 4.6652e-01, PNorm = 99.2311, GNorm = 1.2833, lr_0 = 4.6094e-04\n",
      "Loss = 5.7133e-01, PNorm = 99.2952, GNorm = 1.4062, lr_0 = 4.5616e-04\n",
      "Loss = 5.1146e-01, PNorm = 99.3744, GNorm = 0.9661, lr_0 = 4.5143e-04\n",
      "Validation prc-auc = 0.702302\n",
      " 37%|███▋      | 18/49 [03:47<06:29, 12.56s/it]Epoch 18\n",
      "Loss = 4.5711e-01, PNorm = 99.4486, GNorm = 0.8978, lr_0 = 4.4675e-04\n",
      "Loss = 5.1450e-01, PNorm = 99.5158, GNorm = 1.0773, lr_0 = 4.4212e-04\n",
      "Loss = 5.4205e-01, PNorm = 99.5852, GNorm = 0.9560, lr_0 = 4.3754e-04\n",
      "Loss = 5.7246e-01, PNorm = 99.6483, GNorm = 1.1926, lr_0 = 4.3300e-04\n",
      "Loss = 4.6836e-01, PNorm = 99.7024, GNorm = 0.8893, lr_0 = 4.2851e-04\n",
      "Validation prc-auc = 0.715082\n",
      " 39%|███▉      | 19/49 [04:00<06:19, 12.66s/it]Epoch 19\n",
      "Loss = 4.8704e-01, PNorm = 99.7477, GNorm = 0.8783, lr_0 = 4.2407e-04\n",
      "Loss = 4.9577e-01, PNorm = 99.7995, GNorm = 1.4950, lr_0 = 4.1967e-04\n",
      "Loss = 5.3146e-01, PNorm = 99.8667, GNorm = 1.1820, lr_0 = 4.1532e-04\n",
      "Loss = 5.1071e-01, PNorm = 99.9379, GNorm = 1.1795, lr_0 = 4.1101e-04\n",
      "Loss = 5.0250e-01, PNorm = 100.0001, GNorm = 1.0708, lr_0 = 4.0675e-04\n",
      "Validation prc-auc = 0.713267\n",
      " 41%|████      | 20/49 [04:12<06:05, 12.62s/it]Epoch 20\n",
      "Loss = 5.1530e-01, PNorm = 100.0550, GNorm = 2.5589, lr_0 = 4.0253e-04\n",
      "Loss = 4.7558e-01, PNorm = 100.1062, GNorm = 0.8899, lr_0 = 3.9836e-04\n",
      "Loss = 5.1477e-01, PNorm = 100.1580, GNorm = 1.3610, lr_0 = 3.9423e-04\n",
      "Loss = 4.8478e-01, PNorm = 100.2147, GNorm = 0.9908, lr_0 = 3.9014e-04\n",
      "Loss = 5.1785e-01, PNorm = 100.2678, GNorm = 1.3075, lr_0 = 3.8609e-04\n",
      "Validation prc-auc = 0.697765\n",
      " 43%|████▎     | 21/49 [04:25<05:51, 12.56s/it]Epoch 21\n",
      "Loss = 4.8804e-01, PNorm = 100.3286, GNorm = 1.9389, lr_0 = 3.8169e-04\n",
      "Loss = 4.4829e-01, PNorm = 100.3923, GNorm = 0.9990, lr_0 = 3.7773e-04\n",
      "Loss = 5.3973e-01, PNorm = 100.4597, GNorm = 1.1261, lr_0 = 3.7382e-04\n",
      "Loss = 4.5359e-01, PNorm = 100.5230, GNorm = 1.4720, lr_0 = 3.6994e-04\n",
      "Validation prc-auc = 0.730478\n",
      " 45%|████▍     | 22/49 [04:37<05:40, 12.60s/it]Epoch 22\n",
      "Loss = 5.0334e-01, PNorm = 100.5881, GNorm = 1.4204, lr_0 = 3.6610e-04\n",
      "Loss = 5.2330e-01, PNorm = 100.6420, GNorm = 1.1426, lr_0 = 3.6231e-04\n",
      "Loss = 4.4600e-01, PNorm = 100.6945, GNorm = 1.3572, lr_0 = 3.5855e-04\n",
      "Loss = 4.6355e-01, PNorm = 100.7440, GNorm = 1.0567, lr_0 = 3.5483e-04\n",
      "Loss = 5.2424e-01, PNorm = 100.7986, GNorm = 1.2341, lr_0 = 3.5115e-04\n",
      "Validation prc-auc = 0.710172\n",
      " 47%|████▋     | 23/49 [04:50<05:26, 12.57s/it]Epoch 23\n",
      "Loss = 4.8506e-01, PNorm = 100.8470, GNorm = 1.5420, lr_0 = 3.4751e-04\n",
      "Loss = 4.8682e-01, PNorm = 100.8904, GNorm = 0.9928, lr_0 = 3.4391e-04\n",
      "Loss = 4.5869e-01, PNorm = 100.9296, GNorm = 2.0953, lr_0 = 3.4034e-04\n",
      "Loss = 5.0980e-01, PNorm = 100.9674, GNorm = 1.1891, lr_0 = 3.3681e-04\n",
      "Loss = 4.5286e-01, PNorm = 101.0165, GNorm = 0.9336, lr_0 = 3.3332e-04\n",
      "Validation prc-auc = 0.728259\n",
      " 49%|████▉     | 24/49 [05:03<05:17, 12.72s/it]Epoch 24\n",
      "Loss = 4.8516e-01, PNorm = 101.0666, GNorm = 1.8970, lr_0 = 3.2952e-04\n",
      "Loss = 4.8621e-01, PNorm = 101.1131, GNorm = 1.4264, lr_0 = 3.2610e-04\n",
      "Loss = 4.3167e-01, PNorm = 101.1564, GNorm = 1.1878, lr_0 = 3.2272e-04\n",
      "Loss = 4.2437e-01, PNorm = 101.2023, GNorm = 2.7617, lr_0 = 3.1937e-04\n",
      "Loss = 4.8904e-01, PNorm = 101.2491, GNorm = 1.7485, lr_0 = 3.1606e-04\n",
      "Validation prc-auc = 0.733935\n",
      " 51%|█████     | 25/49 [05:16<05:04, 12.69s/it]Epoch 25\n",
      "Loss = 5.2475e-01, PNorm = 101.2964, GNorm = 2.3993, lr_0 = 3.1279e-04\n",
      "Loss = 4.6621e-01, PNorm = 101.3451, GNorm = 1.2041, lr_0 = 3.0954e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.3867, GNorm = 1.1062, lr_0 = 3.0633e-04\n",
      "Loss = 4.7162e-01, PNorm = 101.4270, GNorm = 1.3346, lr_0 = 3.0316e-04\n",
      "Loss = 4.3106e-01, PNorm = 101.4674, GNorm = 1.6084, lr_0 = 3.0001e-04\n",
      "Validation prc-auc = 0.729222\n",
      " 53%|█████▎    | 26/49 [05:28<04:50, 12.65s/it]Epoch 26\n",
      "Loss = 4.3461e-01, PNorm = 101.5064, GNorm = 1.1614, lr_0 = 2.9690e-04\n",
      "Loss = 4.8308e-01, PNorm = 101.5477, GNorm = 2.9387, lr_0 = 2.9382e-04\n",
      "Loss = 4.4844e-01, PNorm = 101.5879, GNorm = 1.3525, lr_0 = 2.9078e-04\n",
      "Loss = 4.5905e-01, PNorm = 101.6276, GNorm = 1.7554, lr_0 = 2.8776e-04\n",
      "Validation prc-auc = 0.723556\n",
      " 55%|█████▌    | 27/49 [05:41<04:36, 12.57s/it]Epoch 27\n",
      "Loss = 3.8075e-01, PNorm = 101.6739, GNorm = 1.2324, lr_0 = 2.8448e-04\n",
      "Loss = 4.4958e-01, PNorm = 101.7146, GNorm = 1.6542, lr_0 = 2.8153e-04\n",
      "Loss = 4.4140e-01, PNorm = 101.7589, GNorm = 1.4257, lr_0 = 2.7861e-04\n",
      "Loss = 4.2466e-01, PNorm = 101.8007, GNorm = 1.7038, lr_0 = 2.7572e-04\n",
      "Loss = 4.7970e-01, PNorm = 101.8378, GNorm = 1.3090, lr_0 = 2.7286e-04\n",
      "Validation prc-auc = 0.707338\n",
      " 57%|█████▋    | 28/49 [05:53<04:24, 12.57s/it]Epoch 28\n",
      "Loss = 4.5278e-01, PNorm = 101.8740, GNorm = 1.3734, lr_0 = 2.7003e-04\n",
      "Loss = 4.5094e-01, PNorm = 101.9079, GNorm = 1.0547, lr_0 = 2.6723e-04\n",
      "Loss = 4.1357e-01, PNorm = 101.9411, GNorm = 1.5816, lr_0 = 2.6446e-04\n",
      "Loss = 4.6498e-01, PNorm = 101.9734, GNorm = 1.8609, lr_0 = 2.6172e-04\n",
      "Loss = 4.2933e-01, PNorm = 102.0062, GNorm = 1.0863, lr_0 = 2.5901e-04\n",
      "Validation prc-auc = 0.699879\n",
      " 59%|█████▉    | 29/49 [06:06<04:10, 12.53s/it]Epoch 29\n",
      "Loss = 3.9687e-01, PNorm = 102.0364, GNorm = 1.0911, lr_0 = 2.5632e-04\n",
      "Loss = 3.9953e-01, PNorm = 102.0640, GNorm = 1.2628, lr_0 = 2.5366e-04\n",
      "Loss = 4.5717e-01, PNorm = 102.0935, GNorm = 1.8129, lr_0 = 2.5103e-04\n",
      "Loss = 4.1537e-01, PNorm = 102.1263, GNorm = 1.2622, lr_0 = 2.4843e-04\n",
      "Loss = 4.6298e-01, PNorm = 102.1587, GNorm = 1.6679, lr_0 = 2.4585e-04\n",
      "Validation prc-auc = 0.729581\n",
      " 61%|██████    | 30/49 [06:18<03:59, 12.58s/it]Epoch 30\n",
      "Loss = 4.4116e-01, PNorm = 102.1918, GNorm = 2.3824, lr_0 = 2.4330e-04\n",
      "Loss = 4.4225e-01, PNorm = 102.2200, GNorm = 2.0057, lr_0 = 2.4078e-04\n",
      "Loss = 4.1512e-01, PNorm = 102.2495, GNorm = 1.2579, lr_0 = 2.3828e-04\n",
      "Loss = 4.3965e-01, PNorm = 102.2783, GNorm = 1.9444, lr_0 = 2.3581e-04\n",
      "Validation prc-auc = 0.721862\n",
      " 63%|██████▎   | 31/49 [06:31<03:45, 12.52s/it]Epoch 31\n",
      "Loss = 4.1521e-01, PNorm = 102.3138, GNorm = 2.0351, lr_0 = 2.3312e-04\n",
      "Loss = 4.6530e-01, PNorm = 102.3409, GNorm = 0.9553, lr_0 = 2.3071e-04\n",
      "Loss = 4.4350e-01, PNorm = 102.3687, GNorm = 1.5819, lr_0 = 2.2831e-04\n",
      "Loss = 4.1122e-01, PNorm = 102.3959, GNorm = 1.5397, lr_0 = 2.2595e-04\n",
      "Loss = 3.9777e-01, PNorm = 102.4228, GNorm = 0.9937, lr_0 = 2.2360e-04\n",
      "Validation prc-auc = 0.721970\n",
      " 65%|██████▌   | 32/49 [06:43<03:32, 12.50s/it]Epoch 32\n",
      "Loss = 4.3843e-01, PNorm = 102.4485, GNorm = 3.1887, lr_0 = 2.2129e-04\n",
      "Loss = 3.8235e-01, PNorm = 102.4765, GNorm = 1.1239, lr_0 = 2.1899e-04\n",
      "Loss = 4.2292e-01, PNorm = 102.5009, GNorm = 1.9876, lr_0 = 2.1672e-04\n",
      "Loss = 4.3276e-01, PNorm = 102.5277, GNorm = 1.5407, lr_0 = 2.1447e-04\n",
      "Loss = 4.6404e-01, PNorm = 102.5524, GNorm = 1.9581, lr_0 = 2.1225e-04\n",
      "Validation prc-auc = 0.704753\n",
      " 67%|██████▋   | 33/49 [06:56<03:21, 12.58s/it]Epoch 33\n",
      "Loss = 4.0377e-01, PNorm = 102.5779, GNorm = 1.4487, lr_0 = 2.1005e-04\n",
      "Loss = 4.3812e-01, PNorm = 102.6001, GNorm = 1.7061, lr_0 = 2.0787e-04\n",
      "Loss = 4.1834e-01, PNorm = 102.6218, GNorm = 1.3299, lr_0 = 2.0571e-04\n",
      "Loss = 4.0906e-01, PNorm = 102.6444, GNorm = 1.2884, lr_0 = 2.0358e-04\n",
      "Loss = 4.0979e-01, PNorm = 102.6662, GNorm = 1.7456, lr_0 = 2.0147e-04\n",
      "Validation prc-auc = 0.741242\n",
      " 69%|██████▉   | 34/49 [07:08<03:08, 12.59s/it]Epoch 34\n",
      "Loss = 4.2813e-01, PNorm = 102.6889, GNorm = 2.0504, lr_0 = 1.9917e-04\n",
      "Loss = 4.2911e-01, PNorm = 102.7107, GNorm = 2.0385, lr_0 = 1.9711e-04\n",
      "Loss = 4.0048e-01, PNorm = 102.7322, GNorm = 1.4560, lr_0 = 1.9506e-04\n",
      "Loss = 3.9704e-01, PNorm = 102.7581, GNorm = 1.1820, lr_0 = 1.9304e-04\n",
      "Validation prc-auc = 0.727587\n",
      " 71%|███████▏  | 35/49 [07:21<02:56, 12.63s/it]Epoch 35\n",
      "Loss = 3.3330e-01, PNorm = 102.7780, GNorm = 1.1825, lr_0 = 1.9104e-04\n",
      "Loss = 3.8412e-01, PNorm = 102.7992, GNorm = 1.7658, lr_0 = 1.8906e-04\n",
      "Loss = 3.7517e-01, PNorm = 102.8210, GNorm = 1.2284, lr_0 = 1.8710e-04\n",
      "Loss = 4.5571e-01, PNorm = 102.8433, GNorm = 2.2784, lr_0 = 1.8516e-04\n",
      "Loss = 3.8375e-01, PNorm = 102.8635, GNorm = 1.3376, lr_0 = 1.8324e-04\n",
      "Validation prc-auc = 0.724475\n",
      " 73%|███████▎  | 36/49 [07:34<02:43, 12.59s/it]Epoch 36\n",
      "Loss = 4.4192e-01, PNorm = 102.8839, GNorm = 1.9883, lr_0 = 1.8134e-04\n",
      "Loss = 3.9549e-01, PNorm = 102.9023, GNorm = 1.8302, lr_0 = 1.7946e-04\n",
      "Loss = 3.7269e-01, PNorm = 102.9189, GNorm = 1.2762, lr_0 = 1.7760e-04\n",
      "Loss = 4.3072e-01, PNorm = 102.9375, GNorm = 1.6168, lr_0 = 1.7575e-04\n",
      "Loss = 4.1462e-01, PNorm = 102.9576, GNorm = 1.4891, lr_0 = 1.7393e-04\n",
      "Validation prc-auc = 0.729879\n",
      " 76%|███████▌  | 37/49 [07:46<02:30, 12.56s/it]Epoch 37\n",
      "Loss = 3.9510e-01, PNorm = 102.9784, GNorm = 1.6406, lr_0 = 1.7195e-04\n",
      "Loss = 3.8523e-01, PNorm = 102.9971, GNorm = 3.6376, lr_0 = 1.7017e-04\n",
      "Loss = 4.0788e-01, PNorm = 103.0164, GNorm = 1.6742, lr_0 = 1.6840e-04\n",
      "Loss = 3.9008e-01, PNorm = 103.0370, GNorm = 1.3618, lr_0 = 1.6666e-04\n",
      "Loss = 3.6996e-01, PNorm = 103.0561, GNorm = 2.1714, lr_0 = 1.6493e-04\n",
      "Validation prc-auc = 0.732890\n",
      " 78%|███████▊  | 38/49 [07:59<02:18, 12.57s/it]Epoch 38\n",
      "Loss = 4.2739e-01, PNorm = 103.0759, GNorm = 2.0150, lr_0 = 1.6322e-04\n",
      "Loss = 3.7266e-01, PNorm = 103.0961, GNorm = 1.5987, lr_0 = 1.6152e-04\n",
      "Loss = 4.0328e-01, PNorm = 103.1141, GNorm = 1.2749, lr_0 = 1.5985e-04\n",
      "Loss = 4.0170e-01, PNorm = 103.1329, GNorm = 1.6032, lr_0 = 1.5819e-04\n",
      "Loss = 3.5034e-01, PNorm = 103.1500, GNorm = 1.2491, lr_0 = 1.5655e-04\n",
      "Validation prc-auc = 0.730448\n",
      " 80%|███████▉  | 39/49 [08:11<02:05, 12.54s/it]Epoch 39\n",
      "Loss = 4.0423e-01, PNorm = 103.1649, GNorm = 3.4590, lr_0 = 1.5493e-04\n",
      "Loss = 4.0749e-01, PNorm = 103.1823, GNorm = 2.6038, lr_0 = 1.5332e-04\n",
      "Loss = 3.7462e-01, PNorm = 103.1983, GNorm = 1.7902, lr_0 = 1.5173e-04\n",
      "Loss = 3.6832e-01, PNorm = 103.2140, GNorm = 2.0638, lr_0 = 1.5016e-04\n",
      "Validation prc-auc = 0.726064\n",
      " 82%|████████▏ | 40/49 [08:24<01:53, 12.63s/it]Epoch 40\n",
      "Loss = 3.8487e-01, PNorm = 103.2275, GNorm = 1.6070, lr_0 = 1.4860e-04\n",
      "Loss = 3.5290e-01, PNorm = 103.2421, GNorm = 2.4138, lr_0 = 1.4706e-04\n",
      "Loss = 4.0514e-01, PNorm = 103.2566, GNorm = 1.1793, lr_0 = 1.4554e-04\n",
      "Loss = 3.6971e-01, PNorm = 103.2715, GNorm = 1.2253, lr_0 = 1.4403e-04\n",
      "Loss = 4.0549e-01, PNorm = 103.2859, GNorm = 1.1838, lr_0 = 1.4253e-04\n",
      "Validation prc-auc = 0.728744\n",
      " 84%|████████▎ | 41/49 [08:37<01:40, 12.60s/it]Epoch 41\n",
      "Loss = 4.0692e-01, PNorm = 103.3017, GNorm = 2.3294, lr_0 = 1.4091e-04\n",
      "Loss = 3.6107e-01, PNorm = 103.3157, GNorm = 1.8161, lr_0 = 1.3945e-04\n",
      "Loss = 4.3158e-01, PNorm = 103.3296, GNorm = 2.0411, lr_0 = 1.3800e-04\n",
      "Loss = 3.8727e-01, PNorm = 103.3434, GNorm = 2.1048, lr_0 = 1.3657e-04\n",
      "Loss = 3.5917e-01, PNorm = 103.3583, GNorm = 0.9664, lr_0 = 1.3515e-04\n",
      "Validation prc-auc = 0.727437\n",
      " 86%|████████▌ | 42/49 [08:49<01:27, 12.57s/it]Epoch 42\n",
      "Loss = 4.1430e-01, PNorm = 103.3714, GNorm = 2.0484, lr_0 = 1.3375e-04\n",
      "Loss = 3.7543e-01, PNorm = 103.3872, GNorm = 2.0368, lr_0 = 1.3237e-04\n",
      "Loss = 4.2834e-01, PNorm = 103.4001, GNorm = 1.5786, lr_0 = 1.3099e-04\n",
      "Loss = 3.5447e-01, PNorm = 103.4133, GNorm = 1.7577, lr_0 = 1.2963e-04\n",
      "Loss = 3.9995e-01, PNorm = 103.4242, GNorm = 1.9164, lr_0 = 1.2829e-04\n",
      "Validation prc-auc = 0.734144\n",
      " 88%|████████▊ | 43/49 [09:02<01:15, 12.57s/it]Epoch 43\n",
      "Loss = 3.3649e-01, PNorm = 103.4355, GNorm = 1.3637, lr_0 = 1.2696e-04\n",
      "Loss = 3.6927e-01, PNorm = 103.4467, GNorm = 2.3235, lr_0 = 1.2564e-04\n",
      "Loss = 3.8944e-01, PNorm = 103.4571, GNorm = 1.8026, lr_0 = 1.2434e-04\n",
      "Loss = 3.8420e-01, PNorm = 103.4687, GNorm = 1.6287, lr_0 = 1.2305e-04\n",
      "Validation prc-auc = 0.731557\n",
      " 90%|████████▉ | 44/49 [09:14<01:03, 12.62s/it]Epoch 44\n",
      "Loss = 3.5538e-01, PNorm = 103.4799, GNorm = 2.2236, lr_0 = 1.2165e-04\n",
      "Loss = 3.3368e-01, PNorm = 103.4906, GNorm = 2.1795, lr_0 = 1.2039e-04\n",
      "Loss = 3.9180e-01, PNorm = 103.4997, GNorm = 2.1030, lr_0 = 1.1914e-04\n",
      "Loss = 3.5748e-01, PNorm = 103.5107, GNorm = 1.3978, lr_0 = 1.1790e-04\n",
      "Loss = 3.7379e-01, PNorm = 103.5203, GNorm = 1.9116, lr_0 = 1.1668e-04\n",
      "Validation prc-auc = 0.722937\n",
      " 92%|█████████▏| 45/49 [09:27<00:50, 12.65s/it]Epoch 45\n",
      "Loss = 3.6534e-01, PNorm = 103.5314, GNorm = 2.0698, lr_0 = 1.1547e-04\n",
      "Loss = 3.5860e-01, PNorm = 103.5417, GNorm = 2.5266, lr_0 = 1.1427e-04\n",
      "Loss = 3.4249e-01, PNorm = 103.5502, GNorm = 2.0074, lr_0 = 1.1309e-04\n",
      "Loss = 3.8670e-01, PNorm = 103.5614, GNorm = 2.2272, lr_0 = 1.1192e-04\n",
      "Loss = 4.4395e-01, PNorm = 103.5698, GNorm = 3.2936, lr_0 = 1.1076e-04\n",
      "Validation prc-auc = 0.731044\n",
      " 94%|█████████▍| 46/49 [09:40<00:37, 12.63s/it]Epoch 46\n",
      "Loss = 3.5897e-01, PNorm = 103.5800, GNorm = 1.6338, lr_0 = 1.0961e-04\n",
      "Loss = 3.2715e-01, PNorm = 103.5895, GNorm = 1.2976, lr_0 = 1.0847e-04\n",
      "Loss = 3.4290e-01, PNorm = 103.5986, GNorm = 1.9580, lr_0 = 1.0735e-04\n",
      "Loss = 3.4036e-01, PNorm = 103.6072, GNorm = 1.4277, lr_0 = 1.0623e-04\n",
      "Loss = 4.3518e-01, PNorm = 103.6140, GNorm = 2.1300, lr_0 = 1.0513e-04\n",
      "Validation prc-auc = 0.731099\n",
      " 96%|█████████▌| 47/49 [09:52<00:25, 12.63s/it]Epoch 47\n",
      "Loss = 3.6067e-01, PNorm = 103.6237, GNorm = 1.7237, lr_0 = 1.0393e-04\n",
      "Loss = 3.7243e-01, PNorm = 103.6312, GNorm = 1.5077, lr_0 = 1.0285e-04\n",
      "Loss = 3.9727e-01, PNorm = 103.6384, GNorm = 1.3241, lr_0 = 1.0179e-04\n",
      "Loss = 3.4225e-01, PNorm = 103.6475, GNorm = 0.9065, lr_0 = 1.0073e-04\n",
      "Validation prc-auc = 0.733490\n",
      " 98%|█████████▊| 48/49 [10:05<00:12, 12.63s/it]Epoch 48\n",
      "Loss = 3.6779e-01, PNorm = 103.6554, GNorm = 2.3459, lr_0 = 1.0000e-04\n",
      "Loss = 3.6082e-01, PNorm = 103.6636, GNorm = 1.3462, lr_0 = 1.0000e-04\n",
      "Loss = 3.7138e-01, PNorm = 103.6726, GNorm = 1.9617, lr_0 = 1.0000e-04\n",
      "Loss = 3.5044e-01, PNorm = 103.6815, GNorm = 1.5092, lr_0 = 1.0000e-04\n",
      "Loss = 3.6957e-01, PNorm = 103.6885, GNorm = 2.6978, lr_0 = 1.0000e-04\n",
      "Validation prc-auc = 0.733983\n",
      "100%|██████████| 49/49 [10:17<00:00, 12.61s/it]\n",
      "Model 0 best validation prc-auc = 0.741242 on epoch 33\n",
      "Loading pretrained parameter \"encoder.encoder.0.cached_zero_vector\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_i.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_h.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.weight\".\n",
      "Loading pretrained parameter \"encoder.encoder.0.W_o.bias\".\n",
      "Loading pretrained parameter \"ffn.1.weight\".\n",
      "Loading pretrained parameter \"ffn.1.bias\".\n",
      "Loading pretrained parameter \"ffn.4.weight\".\n",
      "Loading pretrained parameter \"ffn.4.bias\".\n",
      "Loading pretrained parameter \"ffn.7.weight\".\n",
      "Loading pretrained parameter \"ffn.7.bias\".\n",
      "Moving model to cuda\n",
      "Model 0 test prc-auc = 0.741242                \n",
      "Ensemble test prc-auc = 0.741242\n",
      "1-fold cross validation\n",
      "\tSeed 0 ==> test prc-auc = 0.741242\n",
      "Overall test prc-auc = 0.741242 +/- 0.000000\n",
      "Elapsed time = 0:10:21\n"
     ]
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "ename": "ValueError",
     "evalue": "Input contains NaN.",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[15], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m get_hi_metrics(test_result,test_result[\u001b[39m'\u001b[39;49m\u001b[39mpreds\u001b[39;49m\u001b[39m'\u001b[39;49m])\n",
      "File \u001b[0;32m/data/steshin/gero_benchmark/notebooks/models/hi/drd2/../../../../code/metrics.py:37\u001b[0m, in \u001b[0;36mget_hi_metrics\u001b[0;34m(data, y_pred)\u001b[0m\n\u001b[1;32m     35\u001b[0m y \u001b[39m=\u001b[39m data[\u001b[39m'\u001b[39m\u001b[39mvalue\u001b[39m\u001b[39m'\u001b[39m]\u001b[39m.\u001b[39mastype(\u001b[39mfloat\u001b[39m)\n\u001b[1;32m     36\u001b[0m y_prob \u001b[39m=\u001b[39m sigmoid(y_pred)\n\u001b[0;32m---> 37\u001b[0m roc_auc \u001b[39m=\u001b[39m roc_auc_score(y, y_prob)\n\u001b[1;32m     38\u001b[0m prc_auc \u001b[39m=\u001b[39m average_precision_score(y, y_prob)\n\u001b[1;32m     40\u001b[0m two_class_prob \u001b[39m=\u001b[39m np\u001b[39m.\u001b[39mstack([\u001b[39m1.0\u001b[39m \u001b[39m-\u001b[39m y_prob, y_prob])\u001b[39m.\u001b[39mtranspose()\n",
      "File \u001b[0;32m~/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/sklearn/metrics/_ranking.py:551\u001b[0m, in \u001b[0;36mroc_auc_score\u001b[0;34m(y_true, y_score, average, sample_weight, max_fpr, multi_class, labels)\u001b[0m\n\u001b[1;32m    549\u001b[0m y_type \u001b[39m=\u001b[39m type_of_target(y_true, input_name\u001b[39m=\u001b[39m\u001b[39m\"\u001b[39m\u001b[39my_true\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[1;32m    550\u001b[0m y_true \u001b[39m=\u001b[39m check_array(y_true, ensure_2d\u001b[39m=\u001b[39m\u001b[39mFalse\u001b[39;00m, dtype\u001b[39m=\u001b[39m\u001b[39mNone\u001b[39;00m)\n\u001b[0;32m--> 551\u001b[0m y_score \u001b[39m=\u001b[39m check_array(y_score, ensure_2d\u001b[39m=\u001b[39;49m\u001b[39mFalse\u001b[39;49;00m)\n\u001b[1;32m    553\u001b[0m \u001b[39mif\u001b[39;00m y_type \u001b[39m==\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mmulticlass\u001b[39m\u001b[39m\"\u001b[39m \u001b[39mor\u001b[39;00m (\n\u001b[1;32m    554\u001b[0m     y_type \u001b[39m==\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mbinary\u001b[39m\u001b[39m\"\u001b[39m \u001b[39mand\u001b[39;00m y_score\u001b[39m.\u001b[39mndim \u001b[39m==\u001b[39m \u001b[39m2\u001b[39m \u001b[39mand\u001b[39;00m y_score\u001b[39m.\u001b[39mshape[\u001b[39m1\u001b[39m] \u001b[39m>\u001b[39m \u001b[39m2\u001b[39m\n\u001b[1;32m    555\u001b[0m ):\n\u001b[1;32m    556\u001b[0m     \u001b[39m# do not support partial ROC computation for multiclass\u001b[39;00m\n\u001b[1;32m    557\u001b[0m     \u001b[39mif\u001b[39;00m max_fpr \u001b[39mis\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mNone\u001b[39;00m \u001b[39mand\u001b[39;00m max_fpr \u001b[39m!=\u001b[39m \u001b[39m1.0\u001b[39m:\n",
      "File \u001b[0;32m~/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/sklearn/utils/validation.py:921\u001b[0m, in \u001b[0;36mcheck_array\u001b[0;34m(array, accept_sparse, accept_large_sparse, dtype, order, copy, force_all_finite, ensure_2d, allow_nd, ensure_min_samples, ensure_min_features, estimator, input_name)\u001b[0m\n\u001b[1;32m    915\u001b[0m         \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(\n\u001b[1;32m    916\u001b[0m             \u001b[39m\"\u001b[39m\u001b[39mFound array with dim \u001b[39m\u001b[39m%d\u001b[39;00m\u001b[39m. \u001b[39m\u001b[39m%s\u001b[39;00m\u001b[39m expected <= 2.\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m    917\u001b[0m             \u001b[39m%\u001b[39m (array\u001b[39m.\u001b[39mndim, estimator_name)\n\u001b[1;32m    918\u001b[0m         )\n\u001b[1;32m    920\u001b[0m     \u001b[39mif\u001b[39;00m force_all_finite:\n\u001b[0;32m--> 921\u001b[0m         _assert_all_finite(\n\u001b[1;32m    922\u001b[0m             array,\n\u001b[1;32m    923\u001b[0m             input_name\u001b[39m=\u001b[39;49minput_name,\n\u001b[1;32m    924\u001b[0m             estimator_name\u001b[39m=\u001b[39;49mestimator_name,\n\u001b[1;32m    925\u001b[0m             allow_nan\u001b[39m=\u001b[39;49mforce_all_finite \u001b[39m==\u001b[39;49m \u001b[39m\"\u001b[39;49m\u001b[39mallow-nan\u001b[39;49m\u001b[39m\"\u001b[39;49m,\n\u001b[1;32m    926\u001b[0m         )\n\u001b[1;32m    928\u001b[0m \u001b[39mif\u001b[39;00m ensure_min_samples \u001b[39m>\u001b[39m \u001b[39m0\u001b[39m:\n\u001b[1;32m    929\u001b[0m     n_samples \u001b[39m=\u001b[39m _num_samples(array)\n",
      "File \u001b[0;32m~/miniconda3/envs/lohi_benchmark/lib/python3.10/site-packages/sklearn/utils/validation.py:161\u001b[0m, in \u001b[0;36m_assert_all_finite\u001b[0;34m(X, allow_nan, msg_dtype, estimator_name, input_name)\u001b[0m\n\u001b[1;32m    144\u001b[0m \u001b[39mif\u001b[39;00m estimator_name \u001b[39mand\u001b[39;00m input_name \u001b[39m==\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mX\u001b[39m\u001b[39m\"\u001b[39m \u001b[39mand\u001b[39;00m has_nan_error:\n\u001b[1;32m    145\u001b[0m     \u001b[39m# Improve the error message on how to handle missing values in\u001b[39;00m\n\u001b[1;32m    146\u001b[0m     \u001b[39m# scikit-learn.\u001b[39;00m\n\u001b[1;32m    147\u001b[0m     msg_err \u001b[39m+\u001b[39m\u001b[39m=\u001b[39m (\n\u001b[1;32m    148\u001b[0m         \u001b[39mf\u001b[39m\u001b[39m\"\u001b[39m\u001b[39m\\n\u001b[39;00m\u001b[39m{\u001b[39;00mestimator_name\u001b[39m}\u001b[39;00m\u001b[39m does not accept missing values\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m    149\u001b[0m         \u001b[39m\"\u001b[39m\u001b[39m encoded as NaN natively. For supervised learning, you might want\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m    159\u001b[0m         \u001b[39m\"\u001b[39m\u001b[39m#estimators-that-handle-nan-values\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m    160\u001b[0m     )\n\u001b[0;32m--> 161\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(msg_err)\n",
      "\u001b[0;31mValueError\u001b[0m: Input contains NaN."
     ]
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>smiles</th>\n",
       "      <th>value</th>\n",
       "      <th>preds</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>383</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2cccc(C(=O)N3CCCCC3)c2)CC1</td>\n",
       "      <td>True</td>\n",
       "      <td>0.148691</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>386</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2cccc(CN3CCCCC3=O)c2)CC1</td>\n",
       "      <td>True</td>\n",
       "      <td>0.137544</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>389</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2ccccc2CN2CCCCC2=O)CC1</td>\n",
       "      <td>True</td>\n",
       "      <td>0.049242</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2695</td>\n",
       "      <td>COc1ccccc1N1CCN(CC2COCC(c3ccccc3)(c3ccccc3)O2)CC1</td>\n",
       "      <td>True</td>\n",
       "      <td>0.029785</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2995</td>\n",
       "      <td>COc1ccccc1N1CCN(C[C@H]2OCCOC2(c2ccccc2)c2ccccc...</td>\n",
       "      <td>False</td>\n",
       "      <td>0.523535</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1186</th>\n",
       "      <td>5766</td>\n",
       "      <td>O=S(=O)(c1ccccc1)c1cnc2c(N3CCNCC3)cccc2c1</td>\n",
       "      <td>True</td>\n",
       "      <td>0.073102</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1187</th>\n",
       "      <td>6025</td>\n",
       "      <td>O[C@H]1[C@@H](NC[C@@H]2COc3ccccc3O2)CC[C@@H]1O...</td>\n",
       "      <td>False</td>\n",
       "      <td>0.044055</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1188</th>\n",
       "      <td>6018</td>\n",
       "      <td>O[C@@H]1[C@H](NC[C@@H]2COc3ccccc3O2)CC[C@H]1Oc...</td>\n",
       "      <td>False</td>\n",
       "      <td>0.737260</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1189</th>\n",
       "      <td>6019</td>\n",
       "      <td>O[C@@H]1[C@H](NC[C@H]2COc3ccccc3O2)CC[C@H]1Oc1...</td>\n",
       "      <td>False</td>\n",
       "      <td>0.058900</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1190</th>\n",
       "      <td>6026</td>\n",
       "      <td>O[C@H]1[C@@H](NC[C@H]2COc3ccccc3O2)CC[C@@H]1Oc...</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1191 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      Unnamed: 0                                             smiles  value  \\\n",
       "0            383   CC(C)Oc1ccccc1N1CCN(Cc2cccc(C(=O)N3CCCCC3)c2)CC1   True   \n",
       "1            386     CC(C)Oc1ccccc1N1CCN(Cc2cccc(CN3CCCCC3=O)c2)CC1   True   \n",
       "2            389       CC(C)Oc1ccccc1N1CCN(Cc2ccccc2CN2CCCCC2=O)CC1   True   \n",
       "3           2695  COc1ccccc1N1CCN(CC2COCC(c3ccccc3)(c3ccccc3)O2)CC1   True   \n",
       "4           2995  COc1ccccc1N1CCN(C[C@H]2OCCOC2(c2ccccc2)c2ccccc...  False   \n",
       "...          ...                                                ...    ...   \n",
       "1186        5766          O=S(=O)(c1ccccc1)c1cnc2c(N3CCNCC3)cccc2c1   True   \n",
       "1187        6025  O[C@H]1[C@@H](NC[C@@H]2COc3ccccc3O2)CC[C@@H]1O...  False   \n",
       "1188        6018  O[C@@H]1[C@H](NC[C@@H]2COc3ccccc3O2)CC[C@H]1Oc...  False   \n",
       "1189        6019  O[C@@H]1[C@H](NC[C@H]2COc3ccccc3O2)CC[C@H]1Oc1...  False   \n",
       "1190        6026  O[C@H]1[C@@H](NC[C@H]2COc3ccccc3O2)CC[C@@H]1Oc...  False   \n",
       "\n",
       "         preds  \n",
       "0     0.148691  \n",
       "1     0.137544  \n",
       "2     0.049242  \n",
       "3     0.029785  \n",
       "4     0.523535  \n",
       "...        ...  \n",
       "1186  0.073102  \n",
       "1187  0.044055  \n",
       "1188  0.737260  \n",
       "1189  0.058900  \n",
       "1190       NaN  \n",
       "\n",
       "[1191 rows x 4 columns]"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>smiles</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>383</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2cccc(C(=O)N3CCCCC3)c2)CC1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>386</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2cccc(CN3CCCCC3=O)c2)CC1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>389</td>\n",
       "      <td>CC(C)Oc1ccccc1N1CCN(Cc2ccccc2CN2CCCCC2=O)CC1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2695</td>\n",
       "      <td>COc1ccccc1N1CCN(CC2COCC(c3ccccc3)(c3ccccc3)O2)CC1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2995</td>\n",
       "      <td>COc1ccccc1N1CCN(C[C@H]2OCCOC2(c2ccccc2)c2ccccc...</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1186</th>\n",
       "      <td>5766</td>\n",
       "      <td>O=S(=O)(c1ccccc1)c1cnc2c(N3CCNCC3)cccc2c1</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1187</th>\n",
       "      <td>6025</td>\n",
       "      <td>O[C@H]1[C@@H](NC[C@@H]2COc3ccccc3O2)CC[C@@H]1O...</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1188</th>\n",
       "      <td>6018</td>\n",
       "      <td>O[C@@H]1[C@H](NC[C@@H]2COc3ccccc3O2)CC[C@H]1Oc...</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1189</th>\n",
       "      <td>6019</td>\n",
       "      <td>O[C@@H]1[C@H](NC[C@H]2COc3ccccc3O2)CC[C@H]1Oc1...</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1190</th>\n",
       "      <td>6026</td>\n",
       "      <td>O[C@H]1[C@@H](NC[C@H]2COc3ccccc3O2)CC[C@@H]1Oc...</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1191 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      Unnamed: 0                                             smiles  value\n",
       "0            383   CC(C)Oc1ccccc1N1CCN(Cc2cccc(C(=O)N3CCCCC3)c2)CC1   True\n",
       "1            386     CC(C)Oc1ccccc1N1CCN(Cc2cccc(CN3CCCCC3=O)c2)CC1   True\n",
       "2            389       CC(C)Oc1ccccc1N1CCN(Cc2ccccc2CN2CCCCC2=O)CC1   True\n",
       "3           2695  COc1ccccc1N1CCN(CC2COCC(c3ccccc3)(c3ccccc3)O2)CC1   True\n",
       "4           2995  COc1ccccc1N1CCN(C[C@H]2OCCOC2(c2ccccc2)c2ccccc...  False\n",
       "...          ...                                                ...    ...\n",
       "1186        5766          O=S(=O)(c1ccccc1)c1cnc2c(N3CCNCC3)cccc2c1   True\n",
       "1187        6025  O[C@H]1[C@@H](NC[C@@H]2COc3ccccc3O2)CC[C@@H]1O...  False\n",
       "1188        6018  O[C@@H]1[C@H](NC[C@@H]2COc3ccccc3O2)CC[C@H]1Oc...  False\n",
       "1189        6019  O[C@@H]1[C@H](NC[C@H]2COc3ccccc3O2)CC[C@H]1Oc1...  False\n",
       "1190        6026  O[C@H]1[C@@H](NC[C@H]2COc3ccccc3O2)CC[C@@H]1Oc...  False\n",
       "\n",
       "[1191 rows x 3 columns]"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "lohi_benchmark",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.17"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "6866b008e29a6b93725c754ff35518c878854bf4c51b70cc5a6a33e53883e114"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
