{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "316f0514",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-a0bf155a-639b-5746-92c8-243d8972b5a9\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "d2e28869",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(LSTM_layers = 1, batch_size = 8, beta = 0.15, Lambda = 0.15, \n",
    "               learning_rate = 5e-5, task = None):\n",
    "    options = {}\n",
    "\n",
    "    #basic setting\n",
    "    options['use_cuda'] = True\n",
    "    \n",
    "    task_name = 'nell-995' if task is None else task\n",
    "    options['vocab_dir'] = f'../MINERVA/datasets/data_preprocessed/nell-995/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "    options['relation_vocab'] = json.load(open(options['vocab_dir'] + '/relation_vocab.json'))\n",
    "    options['entity_vocab'] = json.load(open(options['vocab_dir'] + '/entity_vocab.json'))\n",
    "    \n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_NELL-sub-tune/'\n",
    "        options['output_dir'] = './outputs_NELL-sub-tune/'\n",
    "    else:\n",
    "        options['pretrain_model_dir'] = f'./outputs_NELL-sub-tune/'\n",
    "        options['model_dir'] = f'./outputs_NELL-sub-tune/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_NELL-sub-tune/{task_name}/'\n",
    "        if not os.path.exists(options['output_dir']):\n",
    "            os.makedirs(options['output_dir'])\n",
    "        if not os.path.exists(options['model_dir']):\n",
    "            os.makedirs(options['model_dir'])\n",
    "\n",
    "    #agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = LSTM_layers\n",
    "    options['max_num_actions'] = 70\n",
    "    options['gnn_layer'] = 1\n",
    "\n",
    "    #hyperparameters\n",
    "    options['test_rollouts'] = 70\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = batch_size\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = beta\n",
    "    options['Lambda'] = Lambda\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = learning_rate\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 200\n",
    "    options['total_iterations'] = 2000#*(64/batch_size)\n",
    "    options['pool'] = 'max'\n",
    "    \n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "976c8391",
   "metadata": {},
   "outputs": [],
   "source": [
    "# from model.ours2 import *\n",
    "\n",
    "# results = {}\n",
    "# for layer in [1, 2]:\n",
    "#     for bl in [0.1, 0.08, 0.12, 0.05, 0.15, 0.02, 0.18]:\n",
    "#         for bs in [32, 64, 128]:\n",
    "#             for lr in [1e-4, 5e-5, 5e-4, 1e-3, 1e-5]:\n",
    "#                 params = set_params(layer, bs, bl, bl, lr)\n",
    "#                 name = f'{layer}-{bs}-{bl}-{bl}-{lr}'\n",
    "\n",
    "#                 trainer = Trainer(params)\n",
    "#                 trainer.train()\n",
    "#                 torch.cuda.empty_cache()\n",
    "\n",
    "#                 trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt'))\n",
    "#                 trainer.agent.eval()\n",
    "#                 trainer.test_environment = trainer.test_test_environment\n",
    "#                 tmp = trainer.test(beam=True, print_paths=False, save_model=False)\n",
    "\n",
    "#                 print(name)\n",
    "#                 print(tmp)\n",
    "#                 print('-------------')\n",
    "#                 results[name] = tmp\n",
    "\n",
    "#                 with open(params['output_dir'] + 'results_table.pk5', 'wb') as f:\n",
    "#                     pickle5.dump(results, f)\n",
    "                    \n",
    "#                 del trainer\n",
    "#                 gc.collect()\n",
    "#                 torch.cuda.empty_cache()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "edcae455",
   "metadata": {},
   "source": [
    "# Testing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "ef9730d1",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('./outputs_NELL-sub-tune/' + 'results_table.pk5', 'rb') as f:\n",
    "    results = pickle5.load(f)\n",
    "check = pd.DataFrame([[k, float(v.split(': ')[-1])] for k,v in results.items()], columns = ['config', 'mrr'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "ca71352c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>config</th>\n",
       "      <th>mrr</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>188</th>\n",
       "      <td>2-64-0.02-0.02-0.001</td>\n",
       "      <td>0.3169</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>193</th>\n",
       "      <td>2-128-0.02-0.02-0.001</td>\n",
       "      <td>0.3228</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>78</th>\n",
       "      <td>1-32-0.02-0.02-0.001</td>\n",
       "      <td>0.3315</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>88</th>\n",
       "      <td>1-128-0.02-0.02-0.001</td>\n",
       "      <td>0.3397</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>187</th>\n",
       "      <td>2-64-0.02-0.02-0.0005</td>\n",
       "      <td>0.3430</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>1-64-0.1-0.1-0.0001</td>\n",
       "      <td>0.5466</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>176</th>\n",
       "      <td>2-128-0.15-0.15-5e-05</td>\n",
       "      <td>0.5469</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>195</th>\n",
       "      <td>2-32-0.18-0.18-0.0001</td>\n",
       "      <td>0.5470</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>196</th>\n",
       "      <td>2-32-0.18-0.18-5e-05</td>\n",
       "      <td>0.5472</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>165</th>\n",
       "      <td>2-32-0.15-0.15-0.0001</td>\n",
       "      <td>0.5474</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>210 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    config     mrr\n",
       "188   2-64-0.02-0.02-0.001  0.3169\n",
       "193  2-128-0.02-0.02-0.001  0.3228\n",
       "78    1-32-0.02-0.02-0.001  0.3315\n",
       "88   1-128-0.02-0.02-0.001  0.3397\n",
       "187  2-64-0.02-0.02-0.0005  0.3430\n",
       "..                     ...     ...\n",
       "5      1-64-0.1-0.1-0.0001  0.5466\n",
       "176  2-128-0.15-0.15-5e-05  0.5469\n",
       "195  2-32-0.18-0.18-0.0001  0.5470\n",
       "196   2-32-0.18-0.18-5e-05  0.5472\n",
       "165  2-32-0.15-0.15-0.0001  0.5474\n",
       "\n",
       "[210 rows x 2 columns]"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "check.sort_values('mrr')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "4bd6c32e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/miniconda3/lib/python3.10/site-packages/torch/nn/_reduction.py:42: UserWarning: size_average and reduce args will be deprecated, please use reduction='none' instead.\n",
      "  warnings.warn(warning.format(ret))\n",
      "/root/Research/GraphRL/Ours/model/ours2.py:334: UserWarning: Implicit dimension choice for log_softmax has been deprecated. Change the call to include dim=X as an argument.\n",
      "  return loss, new_state, F.log_softmax(scores), label_action, chosen_relation\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 20, Train loss: -0.3210, rewards: 0.1596\n",
      "Iteration: 40, Train loss: -0.3281, rewards: 0.3005\n",
      "Iteration: 60, Train loss: -0.3281, rewards: 0.3605\n",
      "Iteration: 80, Train loss: -0.2818, rewards: 0.3395\n",
      "Iteration: 100, Train loss: -0.3002, rewards: 0.3817\n",
      "Iteration: 120, Train loss: -0.2369, rewards: 0.4731\n",
      "Iteration: 140, Train loss: -0.2978, rewards: 0.4400\n",
      "Iteration: 160, Train loss: -0.1922, rewards: 0.4974\n",
      "Iteration: 180, Train loss: -0.2260, rewards: 0.5445\n",
      "Iteration: 200, Train loss: -0.2594, rewards: 0.5424\n",
      "Eval:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/Research/GraphRL/Ours/model/ours2.py:636: UserWarning: __floordiv__ is deprecated, and its behavior will change in a future version of pytorch. It currently rounds toward 0 (like the 'trunc' function NOT 'floor'). This results in incorrect rounding for negative values. To keep the current behavior, use torch.div(a, b, rounding_mode='trunc'), or for actual floor division, use torch.div(a, b, rounding_mode='floor').\n",
      "  y = idx // self.max_num_actions\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hits@1: 0.5862, Hits@3: 0.6515, Hits@10: 0.6850, MRR: 0.6237\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.2489, rewards: 0.5159\n",
      "Iteration: 240, Train loss: -0.2515, rewards: 0.5505\n",
      "Iteration: 260, Train loss: -0.2673, rewards: 0.4759\n",
      "Iteration: 280, Train loss: -0.2142, rewards: 0.5600\n",
      "Iteration: 300, Train loss: -0.1380, rewards: 0.5539\n",
      "Iteration: 320, Train loss: -0.1908, rewards: 0.5513\n",
      "Iteration: 340, Train loss: -0.1693, rewards: 0.5256\n",
      "Iteration: 360, Train loss: -0.1714, rewards: 0.5593\n",
      "Iteration: 380, Train loss: -0.1361, rewards: 0.5440\n",
      "Iteration: 400, Train loss: -0.1528, rewards: 0.5280\n",
      "Eval:\n",
      "Hits@1: 0.5991, Hits@3: 0.6683, Hits@10: 0.6989, MRR: 0.6370\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.2059, rewards: 0.5437\n",
      "Iteration: 440, Train loss: -0.1365, rewards: 0.5709\n",
      "Iteration: 460, Train loss: -0.1765, rewards: 0.6014\n",
      "Iteration: 480, Train loss: -0.1391, rewards: 0.5732\n",
      "Iteration: 500, Train loss: -0.1226, rewards: 0.5867\n",
      "Iteration: 520, Train loss: -0.1523, rewards: 0.5963\n",
      "Iteration: 540, Train loss: -0.1561, rewards: 0.5848\n",
      "Iteration: 560, Train loss: -0.1680, rewards: 0.5947\n",
      "Iteration: 580, Train loss: -0.1120, rewards: 0.5673\n",
      "Iteration: 600, Train loss: -0.1024, rewards: 0.5845\n",
      "Eval:\n",
      "Hits@1: 0.6265, Hits@3: 0.6802, Hits@10: 0.7070, MRR: 0.6568\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.1347, rewards: 0.5624\n",
      "Iteration: 640, Train loss: -0.0837, rewards: 0.5957\n",
      "Iteration: 660, Train loss: -0.1567, rewards: 0.6099\n",
      "Iteration: 680, Train loss: -0.1513, rewards: 0.6056\n",
      "Iteration: 700, Train loss: -0.1241, rewards: 0.5923\n",
      "Iteration: 720, Train loss: -0.1171, rewards: 0.6121\n",
      "Iteration: 740, Train loss: -0.1515, rewards: 0.5634\n",
      "Iteration: 760, Train loss: -0.1738, rewards: 0.5784\n",
      "Iteration: 780, Train loss: -0.1629, rewards: 0.5881\n",
      "Iteration: 800, Train loss: -0.1188, rewards: 0.5956\n",
      "Eval:\n",
      "Hits@1: 0.6282, Hits@3: 0.6837, Hits@10: 0.7098, MRR: 0.6598\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.0857, rewards: 0.5892\n",
      "Iteration: 840, Train loss: -0.1246, rewards: 0.5889\n",
      "Iteration: 860, Train loss: -0.0897, rewards: 0.5958\n",
      "Iteration: 880, Train loss: -0.1148, rewards: 0.6039\n",
      "Iteration: 900, Train loss: -0.0627, rewards: 0.6096\n",
      "Iteration: 920, Train loss: -0.1410, rewards: 0.5596\n",
      "Iteration: 940, Train loss: -0.0495, rewards: 0.6030\n",
      "Iteration: 960, Train loss: -0.1136, rewards: 0.6467\n",
      "Iteration: 980, Train loss: -0.0627, rewards: 0.6115\n",
      "Iteration: 1000, Train loss: -0.1106, rewards: 0.5959\n",
      "Eval:\n",
      "Hits@1: 0.6384, Hits@3: 0.6855, Hits@10: 0.7083, MRR: 0.6656\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.0770, rewards: 0.6138\n",
      "Iteration: 1040, Train loss: -0.0452, rewards: 0.6155\n",
      "Iteration: 1060, Train loss: -0.0611, rewards: 0.6066\n",
      "Iteration: 1080, Train loss: -0.0980, rewards: 0.5832\n",
      "Iteration: 1100, Train loss: -0.0997, rewards: 0.6055\n",
      "Iteration: 1120, Train loss: -0.0965, rewards: 0.6366\n",
      "Iteration: 1140, Train loss: -0.0910, rewards: 0.5654\n",
      "Iteration: 1160, Train loss: -0.0767, rewards: 0.6001\n",
      "Iteration: 1180, Train loss: -0.1327, rewards: 0.5987\n",
      "Iteration: 1200, Train loss: -0.0633, rewards: 0.6072\n",
      "Eval:\n",
      "Hits@1: 0.6470, Hits@3: 0.6896, Hits@10: 0.7108, MRR: 0.6716\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.0934, rewards: 0.6199\n",
      "Iteration: 1240, Train loss: -0.1041, rewards: 0.5773\n",
      "Iteration: 1260, Train loss: -0.0335, rewards: 0.6059\n",
      "Iteration: 1280, Train loss: -0.0732, rewards: 0.6485\n",
      "Iteration: 1300, Train loss: -0.0245, rewards: 0.6101\n",
      "Iteration: 1320, Train loss: -0.0450, rewards: 0.6046\n",
      "Iteration: 1340, Train loss: -0.1260, rewards: 0.5807\n",
      "Iteration: 1360, Train loss: -0.0543, rewards: 0.6020\n",
      "Iteration: 1380, Train loss: -0.1481, rewards: 0.5965\n",
      "Iteration: 1400, Train loss: -0.0726, rewards: 0.6198\n",
      "Eval:\n",
      "Hits@1: 0.6551, Hits@3: 0.6931, Hits@10: 0.7146, MRR: 0.6770\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.0864, rewards: 0.6252\n",
      "Iteration: 1440, Train loss: -0.1512, rewards: 0.6045\n",
      "Iteration: 1460, Train loss: -0.0492, rewards: 0.6072\n",
      "Iteration: 1480, Train loss: -0.0791, rewards: 0.6168\n",
      "Iteration: 1500, Train loss: -0.0777, rewards: 0.6094\n",
      "Iteration: 1520, Train loss: -0.1038, rewards: 0.6222\n",
      "Iteration: 1540, Train loss: -0.1193, rewards: 0.6080\n",
      "Iteration: 1560, Train loss: -0.1188, rewards: 0.6112\n",
      "Iteration: 1580, Train loss: -0.1448, rewards: 0.6038\n",
      "Iteration: 1600, Train loss: -0.0433, rewards: 0.6242\n",
      "Eval:\n",
      "Hits@1: 0.6599, Hits@3: 0.6969, Hits@10: 0.7146, MRR: 0.6806\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.0324, rewards: 0.6411\n",
      "Iteration: 1640, Train loss: -0.1017, rewards: 0.6245\n",
      "Iteration: 1660, Train loss: -0.0981, rewards: 0.6277\n",
      "Iteration: 1680, Train loss: -0.1152, rewards: 0.6614\n",
      "Iteration: 1700, Train loss: -0.1037, rewards: 0.6440\n",
      "Iteration: 1720, Train loss: -0.1043, rewards: 0.6270\n",
      "Iteration: 1740, Train loss: -0.1299, rewards: 0.6264\n",
      "Iteration: 1760, Train loss: -0.1230, rewards: 0.6541\n",
      "Iteration: 1780, Train loss: -0.0630, rewards: 0.6141\n",
      "Iteration: 1800, Train loss: -0.0914, rewards: 0.6336\n",
      "Eval:\n",
      "Hits@1: 0.6589, Hits@3: 0.6941, Hits@10: 0.7129, MRR: 0.6790\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.1358, rewards: 0.6412\n",
      "Iteration: 1840, Train loss: -0.0564, rewards: 0.6362\n",
      "Iteration: 1860, Train loss: -0.1237, rewards: 0.6403\n",
      "Iteration: 1880, Train loss: -0.1101, rewards: 0.6359\n",
      "Iteration: 1900, Train loss: -0.1421, rewards: 0.6370\n",
      "Iteration: 1920, Train loss: -0.0433, rewards: 0.6159\n",
      "Iteration: 1940, Train loss: -0.1244, rewards: 0.6292\n",
      "Iteration: 1960, Train loss: -0.0541, rewards: 0.6322\n",
      "Iteration: 1980, Train loss: -0.0779, rewards: 0.6060\n",
      "Iteration: 2000, Train loss: -0.0546, rewards: 0.6458\n",
      "Eval:\n",
      "Hits@1: 0.6584, Hits@3: 0.6954, Hits@10: 0.7126, MRR: 0.6795\n",
      "------------------------------------------------------------\n"
     ]
    }
   ],
   "source": [
    "from model.ours2 import *\n",
    "params = set_params(2, 64, 0.1, 0.1, 0.0001)\n",
    "trainer = Trainer(params)\n",
    "trainer.train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "6f45416b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune//test_beam/ ]\n",
      "Hits@1: 0.5148, Hits@3: 0.5792, Hits@10: 0.6087, MRR: 0.5497\n"
     ]
    }
   ],
   "source": [
    "trainer = Trainer(params)\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "# path_logger_file = trainer.path_logger_file\n",
    "output_dir = trainer.output_dir\n",
    "path_logger_file = output_dir\n",
    "\n",
    "if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "    os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "    \n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "trainer.test_environment.test_rollouts = 100\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "25e0dbf2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8022111819355913 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6424133360179872 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.5386351072918237 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8098426870748299 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9283305693753454 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.8952725673514818 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.7806568647242221 (193 queries evaluated)\n",
      "WorksFor\n",
      "MINERVA MAP: 0.8160592607445339 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.946194301013578 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8357692470165488 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "sub_tasks_list = ['AthletePlaysInLeague',\n",
    "'AthletePlaysForTeam ',\n",
    "'AthleteHomeStadium ',\n",
    "'TeamPlaysSport',\n",
    "'AthletePlaysSport',\n",
    "'OrganizationHiredPerson',\n",
    "'PersonBornInLocation',\n",
    "'WorksFor',\n",
    "'organizationheadquarteredincity',\n",
    "'PersonLeadsOrganization']\n",
    "    \n",
    "for sub_task in sub_tasks_list:\n",
    "    trainer.data_input_dir = f'../MINERVA/datasets/data_preprocessed/{sub_task.lower().strip()}'\n",
    "    print(sub_task)\n",
    "    nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", trainer.data_input_dir+'/sort_test.pairs' )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "164442e1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/miniconda3/lib/python3.10/site-packages/torch/nn/_reduction.py:42: UserWarning: size_average and reduce args will be deprecated, please use reduction='none' instead.\n",
      "  warnings.warn(warning.format(ret))\n",
      "/root/Research/GraphRL/Ours/model/ours2.py:334: UserWarning: Implicit dimension choice for log_softmax has been deprecated. Change the call to include dim=X as an argument.\n",
      "  return loss, new_state, F.log_softmax(scores), label_action, chosen_relation\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 20, Train loss: 0.0793, rewards: 0.8507\n",
      "Iteration: 40, Train loss: 0.1363, rewards: 0.8521\n",
      "Iteration: 60, Train loss: 0.1383, rewards: 0.8750\n",
      "Iteration: 80, Train loss: 0.1245, rewards: 0.8743\n",
      "Iteration: 100, Train loss: 0.1147, rewards: 0.8968\n",
      "Iteration: 120, Train loss: 0.1468, rewards: 0.8797\n",
      "Iteration: 140, Train loss: 0.1647, rewards: 0.8749\n",
      "Iteration: 160, Train loss: 0.1757, rewards: 0.8635\n",
      "Iteration: 180, Train loss: 0.1655, rewards: 0.8937\n",
      "Iteration: 200, Train loss: 0.1487, rewards: 0.8888\n",
      "Eval:\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/Research/GraphRL/Ours/model/ours2.py:636: UserWarning: __floordiv__ is deprecated, and its behavior will change in a future version of pytorch. It currently rounds toward 0 (like the 'trunc' function NOT 'floor'). This results in incorrect rounding for negative values. To keep the current behavior, use torch.div(a, b, rounding_mode='trunc'), or for actual floor division, use torch.div(a, b, rounding_mode='floor').\n",
      "  y = idx // self.max_num_actions\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hits@1: 0.8795, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8912\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: 0.1670, rewards: 0.8835\n",
      "Iteration: 240, Train loss: 0.2019, rewards: 0.8789\n",
      "Iteration: 260, Train loss: 0.1503, rewards: 0.8898\n",
      "Iteration: 280, Train loss: 0.1940, rewards: 0.8877\n",
      "Iteration: 300, Train loss: 0.1754, rewards: 0.8844\n",
      "Iteration: 320, Train loss: 0.1801, rewards: 0.8783\n",
      "Iteration: 340, Train loss: 0.1923, rewards: 0.8747\n",
      "Iteration: 360, Train loss: 0.1878, rewards: 0.8807\n",
      "Iteration: 380, Train loss: 0.1460, rewards: 0.8918\n",
      "Iteration: 400, Train loss: 0.2075, rewards: 0.8641\n",
      "Eval:\n",
      "Hits@1: 0.8667, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8840\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: 0.1733, rewards: 0.8820\n",
      "Iteration: 440, Train loss: 0.2363, rewards: 0.8724\n",
      "Iteration: 460, Train loss: 0.2207, rewards: 0.8757\n",
      "Iteration: 480, Train loss: 0.2124, rewards: 0.8625\n",
      "Iteration: 500, Train loss: 0.1699, rewards: 0.8735\n",
      "Iteration: 520, Train loss: 0.1661, rewards: 0.8871\n",
      "Iteration: 540, Train loss: 0.1912, rewards: 0.8708\n",
      "Iteration: 560, Train loss: 0.1898, rewards: 0.8995\n",
      "Iteration: 580, Train loss: 0.1956, rewards: 0.8891\n",
      "Iteration: 600, Train loss: 0.1950, rewards: 0.8837\n",
      "Eval:\n",
      "Hits@1: 0.8795, Hits@3: 0.9026, Hits@10: 0.9051, MRR: 0.8917\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: 0.1740, rewards: 0.8934\n",
      "Iteration: 640, Train loss: 0.2086, rewards: 0.8862\n",
      "Iteration: 660, Train loss: 0.1859, rewards: 0.8890\n",
      "Iteration: 680, Train loss: 0.2213, rewards: 0.8825\n",
      "Iteration: 700, Train loss: 0.1853, rewards: 0.8925\n",
      "Iteration: 720, Train loss: 0.1552, rewards: 0.8993\n",
      "Iteration: 740, Train loss: 0.2042, rewards: 0.8902\n",
      "Iteration: 760, Train loss: 0.1641, rewards: 0.8952\n",
      "Iteration: 780, Train loss: 0.2279, rewards: 0.8812\n",
      "Iteration: 800, Train loss: 0.2112, rewards: 0.8777\n",
      "Eval:\n",
      "Hits@1: 0.7718, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8369\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: 0.1764, rewards: 0.8828\n",
      "Iteration: 840, Train loss: 0.2067, rewards: 0.8846\n",
      "Iteration: 860, Train loss: 0.2180, rewards: 0.8671\n",
      "Iteration: 880, Train loss: 0.2277, rewards: 0.8784\n",
      "Iteration: 900, Train loss: 0.1962, rewards: 0.8690\n",
      "Iteration: 920, Train loss: 0.2004, rewards: 0.8663\n",
      "Iteration: 940, Train loss: 0.1696, rewards: 0.8924\n",
      "Iteration: 960, Train loss: 0.1496, rewards: 0.8868\n",
      "Iteration: 980, Train loss: 0.1930, rewards: 0.8699\n",
      "Iteration: 1000, Train loss: 0.1602, rewards: 0.8980\n",
      "Eval:\n",
      "Hits@1: 0.8769, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8893\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: 0.1769, rewards: 0.8883\n",
      "Iteration: 1040, Train loss: 0.1896, rewards: 0.8851\n",
      "Iteration: 1060, Train loss: 0.1814, rewards: 0.8887\n",
      "Iteration: 1080, Train loss: 0.2046, rewards: 0.8780\n",
      "Iteration: 1100, Train loss: 0.2129, rewards: 0.8720\n",
      "Iteration: 1120, Train loss: 0.2272, rewards: 0.8682\n",
      "Iteration: 1140, Train loss: 0.1918, rewards: 0.8756\n",
      "Iteration: 1160, Train loss: 0.2060, rewards: 0.8802\n",
      "Iteration: 1180, Train loss: 0.1742, rewards: 0.8945\n",
      "Iteration: 1200, Train loss: 0.1676, rewards: 0.8911\n",
      "Eval:\n",
      "Hits@1: 0.8744, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8876\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: 0.1887, rewards: 0.8773\n",
      "Iteration: 1240, Train loss: 0.1859, rewards: 0.8942\n",
      "Iteration: 1260, Train loss: 0.1665, rewards: 0.8839\n",
      "Iteration: 1280, Train loss: 0.1753, rewards: 0.8708\n",
      "Iteration: 1300, Train loss: 0.1907, rewards: 0.8850\n",
      "Iteration: 1320, Train loss: 0.1855, rewards: 0.8852\n",
      "Iteration: 1340, Train loss: 0.2033, rewards: 0.8928\n",
      "Iteration: 1360, Train loss: 0.2010, rewards: 0.8758\n",
      "Iteration: 1380, Train loss: 0.1669, rewards: 0.8689\n",
      "Iteration: 1400, Train loss: 0.2116, rewards: 0.8804\n",
      "Eval:\n",
      "Hits@1: 0.8308, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.8650\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: 0.1953, rewards: 0.8895\n",
      "Iteration: 1440, Train loss: 0.1851, rewards: 0.8800\n",
      "Iteration: 1460, Train loss: 0.1480, rewards: 0.8946\n",
      "Iteration: 1480, Train loss: 0.1702, rewards: 0.8926\n",
      "Iteration: 1500, Train loss: 0.1462, rewards: 0.8928\n",
      "Iteration: 1520, Train loss: 0.1639, rewards: 0.8982\n",
      "Iteration: 1540, Train loss: 0.1425, rewards: 0.8936\n",
      "Iteration: 1560, Train loss: 0.1948, rewards: 0.8842\n",
      "Iteration: 1580, Train loss: 0.2065, rewards: 0.8721\n",
      "Iteration: 1600, Train loss: 0.1671, rewards: 0.8979\n",
      "Eval:\n",
      "Hits@1: 0.6513, Hits@3: 0.8974, Hits@10: 0.9026, MRR: 0.7615\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: 0.2054, rewards: 0.8861\n",
      "Iteration: 1640, Train loss: 0.1984, rewards: 0.8766\n",
      "Iteration: 1660, Train loss: 0.2057, rewards: 0.8863\n",
      "Iteration: 1680, Train loss: 0.2138, rewards: 0.8702\n",
      "Iteration: 1700, Train loss: 0.1866, rewards: 0.8911\n",
      "Iteration: 1720, Train loss: 0.2113, rewards: 0.8803\n",
      "Iteration: 1740, Train loss: 0.1794, rewards: 0.8870\n",
      "Iteration: 1760, Train loss: 0.1939, rewards: 0.8840\n",
      "Iteration: 1780, Train loss: 0.1858, rewards: 0.8862\n",
      "Iteration: 1800, Train loss: 0.2386, rewards: 0.8700\n",
      "Eval:\n",
      "Hits@1: 0.6795, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.7906\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: 0.1892, rewards: 0.8938\n",
      "Iteration: 1840, Train loss: 0.1823, rewards: 0.8879\n",
      "Iteration: 1860, Train loss: 0.1949, rewards: 0.8706\n",
      "Iteration: 1880, Train loss: 0.1825, rewards: 0.8831\n",
      "Iteration: 1900, Train loss: 0.1748, rewards: 0.8968\n",
      "Iteration: 1920, Train loss: 0.1716, rewards: 0.8976\n",
      "Iteration: 1940, Train loss: 0.1462, rewards: 0.8951\n",
      "Iteration: 1960, Train loss: 0.2351, rewards: 0.8793\n",
      "Iteration: 1980, Train loss: 0.1862, rewards: 0.8813\n",
      "Iteration: 2000, Train loss: 0.1664, rewards: 0.8914\n",
      "Eval:\n",
      "Hits@1: 0.6026, Hits@3: 0.9026, Hits@10: 0.9026, MRR: 0.7521\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/athleteplaysinleague//test_beam/ ]\n",
      "Hits@1: 0.8163, Hits@3: 0.8478, Hits@10: 0.8478, MRR: 0.8316\n",
      "MINERVA MAP: 0.9727471566054243 (381 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.1919, rewards: 0.5143\n",
      "Iteration: 40, Train loss: -0.2594, rewards: 0.5306\n",
      "Iteration: 60, Train loss: -0.2746, rewards: 0.5385\n",
      "Iteration: 80, Train loss: -0.2767, rewards: 0.5545\n",
      "Iteration: 100, Train loss: -0.2249, rewards: 0.5502\n",
      "Iteration: 120, Train loss: -0.2371, rewards: 0.5389\n",
      "Iteration: 140, Train loss: -0.2829, rewards: 0.5469\n",
      "Iteration: 160, Train loss: -0.3021, rewards: 0.5415\n",
      "Iteration: 180, Train loss: -0.2572, rewards: 0.5809\n",
      "Iteration: 200, Train loss: -0.2968, rewards: 0.5419\n",
      "Eval:\n",
      "Hits@1: 0.5157, Hits@3: 0.5916, Hits@10: 0.6309, MRR: 0.5594\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.3095, rewards: 0.5616\n",
      "Iteration: 240, Train loss: -0.3266, rewards: 0.5539\n",
      "Iteration: 260, Train loss: -0.3260, rewards: 0.5290\n",
      "Iteration: 280, Train loss: -0.3803, rewards: 0.5661\n",
      "Iteration: 300, Train loss: -0.3735, rewards: 0.5690\n",
      "Iteration: 320, Train loss: -0.3641, rewards: 0.5540\n",
      "Iteration: 340, Train loss: -0.3739, rewards: 0.5901\n",
      "Iteration: 360, Train loss: -0.4243, rewards: 0.5739\n",
      "Iteration: 380, Train loss: -0.4345, rewards: 0.5938\n",
      "Iteration: 400, Train loss: -0.4347, rewards: 0.5943\n",
      "Eval:\n",
      "Hits@1: 0.5236, Hits@3: 0.5864, Hits@10: 0.6204, MRR: 0.5614\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.4343, rewards: 0.5736\n",
      "Iteration: 440, Train loss: -0.4246, rewards: 0.5839\n",
      "Iteration: 460, Train loss: -0.4049, rewards: 0.5845\n",
      "Iteration: 480, Train loss: -0.4154, rewards: 0.5688\n",
      "Iteration: 500, Train loss: -0.3841, rewards: 0.5910\n",
      "Iteration: 520, Train loss: -0.3995, rewards: 0.6196\n",
      "Iteration: 540, Train loss: -0.3730, rewards: 0.5853\n",
      "Iteration: 560, Train loss: -0.4446, rewards: 0.5748\n",
      "Iteration: 580, Train loss: -0.4285, rewards: 0.6122\n",
      "Iteration: 600, Train loss: -0.4256, rewards: 0.5982\n",
      "Eval:\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hits@1: 0.5524, Hits@3: 0.5838, Hits@10: 0.6152, MRR: 0.5760\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.4124, rewards: 0.5971\n",
      "Iteration: 640, Train loss: -0.4030, rewards: 0.6068\n",
      "Iteration: 660, Train loss: -0.4100, rewards: 0.5891\n",
      "Iteration: 680, Train loss: -0.3699, rewards: 0.6144\n",
      "Iteration: 700, Train loss: -0.3821, rewards: 0.6081\n",
      "Iteration: 720, Train loss: -0.3921, rewards: 0.6049\n",
      "Iteration: 740, Train loss: -0.4478, rewards: 0.6170\n",
      "Iteration: 760, Train loss: -0.4174, rewards: 0.5896\n",
      "Iteration: 780, Train loss: -0.4530, rewards: 0.5792\n",
      "Iteration: 800, Train loss: -0.4777, rewards: 0.5854\n",
      "Eval:\n",
      "Hits@1: 0.5419, Hits@3: 0.5890, Hits@10: 0.6099, MRR: 0.5735\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.4451, rewards: 0.5968\n",
      "Iteration: 840, Train loss: -0.4490, rewards: 0.5888\n",
      "Iteration: 860, Train loss: -0.4730, rewards: 0.5861\n",
      "Iteration: 880, Train loss: -0.4266, rewards: 0.5814\n",
      "Iteration: 900, Train loss: -0.4221, rewards: 0.6043\n",
      "Iteration: 920, Train loss: -0.4564, rewards: 0.5957\n",
      "Iteration: 940, Train loss: -0.3911, rewards: 0.5791\n",
      "Iteration: 960, Train loss: -0.4369, rewards: 0.5995\n",
      "Iteration: 980, Train loss: -0.4469, rewards: 0.5957\n",
      "Iteration: 1000, Train loss: -0.4040, rewards: 0.5979\n",
      "Eval:\n",
      "Hits@1: 0.5393, Hits@3: 0.5942, Hits@10: 0.6178, MRR: 0.5740\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.4493, rewards: 0.5935\n",
      "Iteration: 1040, Train loss: -0.4430, rewards: 0.6049\n",
      "Iteration: 1060, Train loss: -0.4063, rewards: 0.6042\n",
      "Iteration: 1080, Train loss: -0.4365, rewards: 0.5878\n",
      "Iteration: 1100, Train loss: -0.4033, rewards: 0.5775\n",
      "Iteration: 1120, Train loss: -0.3968, rewards: 0.6046\n",
      "Iteration: 1140, Train loss: -0.4176, rewards: 0.5969\n",
      "Iteration: 1160, Train loss: -0.4472, rewards: 0.6022\n",
      "Iteration: 1180, Train loss: -0.4260, rewards: 0.6213\n",
      "Iteration: 1200, Train loss: -0.4067, rewards: 0.5871\n",
      "Eval:\n",
      "Hits@1: 0.5419, Hits@3: 0.5995, Hits@10: 0.6335, MRR: 0.5787\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.4293, rewards: 0.6188\n",
      "Iteration: 1240, Train loss: -0.4539, rewards: 0.6214\n",
      "Iteration: 1260, Train loss: -0.4829, rewards: 0.5855\n",
      "Iteration: 1280, Train loss: -0.4691, rewards: 0.6111\n",
      "Iteration: 1300, Train loss: -0.4307, rewards: 0.6121\n",
      "Iteration: 1320, Train loss: -0.4226, rewards: 0.6151\n",
      "Iteration: 1340, Train loss: -0.4572, rewards: 0.5859\n",
      "Iteration: 1360, Train loss: -0.4121, rewards: 0.6101\n",
      "Iteration: 1380, Train loss: -0.4199, rewards: 0.5996\n",
      "Iteration: 1400, Train loss: -0.4105, rewards: 0.6000\n",
      "Eval:\n",
      "Hits@1: 0.5497, Hits@3: 0.5995, Hits@10: 0.6204, MRR: 0.5796\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.4493, rewards: 0.6254\n",
      "Iteration: 1440, Train loss: -0.3861, rewards: 0.6302\n",
      "Iteration: 1460, Train loss: -0.3872, rewards: 0.6182\n",
      "Iteration: 1480, Train loss: -0.4437, rewards: 0.5895\n",
      "Iteration: 1500, Train loss: -0.3776, rewards: 0.5976\n",
      "Iteration: 1520, Train loss: -0.4267, rewards: 0.5825\n",
      "Iteration: 1540, Train loss: -0.3899, rewards: 0.6053\n",
      "Iteration: 1560, Train loss: -0.3707, rewards: 0.6019\n",
      "Iteration: 1580, Train loss: -0.3737, rewards: 0.6034\n",
      "Iteration: 1600, Train loss: -0.3615, rewards: 0.6009\n",
      "Eval:\n",
      "Hits@1: 0.5524, Hits@3: 0.6021, Hits@10: 0.6283, MRR: 0.5831\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.4037, rewards: 0.6163\n",
      "Iteration: 1640, Train loss: -0.3954, rewards: 0.6154\n",
      "Iteration: 1660, Train loss: -0.4193, rewards: 0.6153\n",
      "Iteration: 1680, Train loss: -0.4021, rewards: 0.6107\n",
      "Iteration: 1700, Train loss: -0.3991, rewards: 0.6200\n",
      "Iteration: 1720, Train loss: -0.3689, rewards: 0.6186\n",
      "Iteration: 1740, Train loss: -0.4168, rewards: 0.6042\n",
      "Iteration: 1760, Train loss: -0.4381, rewards: 0.6327\n",
      "Iteration: 1780, Train loss: -0.4210, rewards: 0.6278\n",
      "Iteration: 1800, Train loss: -0.3637, rewards: 0.6257\n",
      "Eval:\n",
      "Hits@1: 0.5524, Hits@3: 0.6021, Hits@10: 0.6283, MRR: 0.5855\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.3940, rewards: 0.6432\n",
      "Iteration: 1840, Train loss: -0.3612, rewards: 0.5950\n",
      "Iteration: 1860, Train loss: -0.4357, rewards: 0.6103\n",
      "Iteration: 1880, Train loss: -0.4150, rewards: 0.6367\n",
      "Iteration: 1900, Train loss: -0.4150, rewards: 0.6068\n",
      "Iteration: 1920, Train loss: -0.3893, rewards: 0.6101\n",
      "Iteration: 1940, Train loss: -0.3877, rewards: 0.6007\n",
      "Iteration: 1960, Train loss: -0.4300, rewards: 0.6229\n",
      "Iteration: 1980, Train loss: -0.3886, rewards: 0.6182\n",
      "Iteration: 2000, Train loss: -0.4090, rewards: 0.5991\n",
      "Eval:\n",
      "Hits@1: 0.5628, Hits@3: 0.5995, Hits@10: 0.6230, MRR: 0.5896\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/athleteplaysforteam//test_beam/ ]\n",
      "Hits@1: 0.4935, Hits@3: 0.5711, Hits@10: 0.6047, MRR: 0.5389\n",
      "MINERVA MAP: 0.8109486336230524 (387 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.3527, rewards: 0.6693\n",
      "Iteration: 40, Train loss: -0.1716, rewards: 0.7665\n",
      "Iteration: 60, Train loss: -0.1647, rewards: 0.7837\n",
      "Iteration: 80, Train loss: -0.1976, rewards: 0.7828\n",
      "Iteration: 100, Train loss: -0.1889, rewards: 0.8024\n",
      "Iteration: 120, Train loss: -0.0997, rewards: 0.8492\n",
      "Iteration: 140, Train loss: -0.0759, rewards: 0.8576\n",
      "Iteration: 160, Train loss: -0.0773, rewards: 0.8459\n",
      "Iteration: 180, Train loss: -0.0341, rewards: 0.8725\n",
      "Iteration: 200, Train loss: 0.0000, rewards: 0.8546\n",
      "Eval:\n",
      "Hits@1: 0.8209, Hits@3: 0.8756, Hits@10: 0.8905, MRR: 0.8518\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.0026, rewards: 0.8657\n",
      "Iteration: 240, Train loss: 0.0020, rewards: 0.8673\n",
      "Iteration: 260, Train loss: -0.0148, rewards: 0.8838\n",
      "Iteration: 280, Train loss: -0.0018, rewards: 0.8630\n",
      "Iteration: 300, Train loss: -0.0202, rewards: 0.8665\n",
      "Iteration: 320, Train loss: -0.0012, rewards: 0.8522\n",
      "Iteration: 340, Train loss: -0.0179, rewards: 0.8598\n",
      "Iteration: 360, Train loss: -0.0086, rewards: 0.8720\n",
      "Iteration: 380, Train loss: -0.0012, rewards: 0.8793\n",
      "Iteration: 400, Train loss: 0.0074, rewards: 0.8712\n",
      "Eval:\n",
      "Hits@1: 0.7960, Hits@3: 0.8806, Hits@10: 0.9005, MRR: 0.8412\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.0052, rewards: 0.8685\n",
      "Iteration: 440, Train loss: 0.0022, rewards: 0.8699\n",
      "Iteration: 460, Train loss: 0.0041, rewards: 0.8658\n",
      "Iteration: 480, Train loss: -0.0011, rewards: 0.8657\n",
      "Iteration: 500, Train loss: 0.0152, rewards: 0.8521\n",
      "Iteration: 520, Train loss: -0.0042, rewards: 0.8741\n",
      "Iteration: 540, Train loss: -0.0035, rewards: 0.8691\n",
      "Iteration: 560, Train loss: 0.0068, rewards: 0.8604\n",
      "Iteration: 580, Train loss: 0.0064, rewards: 0.8568\n",
      "Iteration: 600, Train loss: 0.0211, rewards: 0.8741\n",
      "Eval:\n",
      "Hits@1: 0.7811, Hits@3: 0.8706, Hits@10: 0.9055, MRR: 0.8327\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.0105, rewards: 0.8794\n",
      "Iteration: 640, Train loss: 0.0205, rewards: 0.8666\n",
      "Iteration: 660, Train loss: 0.0003, rewards: 0.8518\n",
      "Iteration: 680, Train loss: 0.0033, rewards: 0.8777\n",
      "Iteration: 700, Train loss: -0.0012, rewards: 0.8529\n",
      "Iteration: 720, Train loss: 0.0066, rewards: 0.8770\n",
      "Iteration: 740, Train loss: -0.0085, rewards: 0.8722\n",
      "Iteration: 760, Train loss: -0.0025, rewards: 0.8875\n",
      "Iteration: 780, Train loss: 0.0118, rewards: 0.8625\n",
      "Iteration: 800, Train loss: 0.0202, rewards: 0.8608\n",
      "Eval:\n",
      "Hits@1: 0.8060, Hits@3: 0.8806, Hits@10: 0.9005, MRR: 0.8472\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: 0.0348, rewards: 0.8743\n",
      "Iteration: 840, Train loss: 0.0303, rewards: 0.8577\n",
      "Iteration: 860, Train loss: -0.0031, rewards: 0.8764\n",
      "Iteration: 880, Train loss: 0.0158, rewards: 0.8854\n",
      "Iteration: 900, Train loss: 0.0224, rewards: 0.8729\n",
      "Iteration: 920, Train loss: 0.0262, rewards: 0.8745\n",
      "Iteration: 940, Train loss: 0.0269, rewards: 0.8761\n",
      "Iteration: 960, Train loss: 0.0119, rewards: 0.8835\n",
      "Iteration: 980, Train loss: 0.0331, rewards: 0.8719\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1000, Train loss: 0.0235, rewards: 0.8732\n",
      "Eval:\n",
      "Hits@1: 0.8259, Hits@3: 0.8856, Hits@10: 0.9005, MRR: 0.8574\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: 0.0357, rewards: 0.8770\n",
      "Iteration: 1040, Train loss: 0.0224, rewards: 0.8800\n",
      "Iteration: 1060, Train loss: 0.0197, rewards: 0.8786\n",
      "Iteration: 1080, Train loss: 0.0247, rewards: 0.8725\n",
      "Iteration: 1100, Train loss: 0.0178, rewards: 0.8819\n",
      "Iteration: 1120, Train loss: 0.0247, rewards: 0.8775\n",
      "Iteration: 1140, Train loss: 0.0431, rewards: 0.8452\n",
      "Iteration: 1160, Train loss: 0.0118, rewards: 0.8779\n",
      "Iteration: 1180, Train loss: 0.0239, rewards: 0.8835\n",
      "Iteration: 1200, Train loss: 0.0267, rewards: 0.8798\n",
      "Eval:\n",
      "Hits@1: 0.8358, Hits@3: 0.8856, Hits@10: 0.9104, MRR: 0.8638\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: 0.0385, rewards: 0.8613\n",
      "Iteration: 1240, Train loss: 0.0299, rewards: 0.8526\n",
      "Iteration: 1260, Train loss: 0.0346, rewards: 0.8809\n",
      "Iteration: 1280, Train loss: 0.0234, rewards: 0.8707\n",
      "Iteration: 1300, Train loss: 0.0346, rewards: 0.8838\n",
      "Iteration: 1320, Train loss: 0.0211, rewards: 0.8640\n",
      "Iteration: 1340, Train loss: 0.0179, rewards: 0.8905\n",
      "Iteration: 1360, Train loss: 0.0173, rewards: 0.8600\n",
      "Iteration: 1380, Train loss: 0.0038, rewards: 0.8515\n",
      "Iteration: 1400, Train loss: 0.0169, rewards: 0.8752\n",
      "Eval:\n",
      "Hits@1: 0.8358, Hits@3: 0.8706, Hits@10: 0.8905, MRR: 0.8583\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: 0.0221, rewards: 0.8823\n",
      "Iteration: 1440, Train loss: 0.0309, rewards: 0.8731\n",
      "Iteration: 1460, Train loss: 0.0335, rewards: 0.8668\n",
      "Iteration: 1480, Train loss: 0.0116, rewards: 0.8794\n",
      "Iteration: 1500, Train loss: 0.0296, rewards: 0.8637\n",
      "Iteration: 1520, Train loss: 0.0152, rewards: 0.8667\n",
      "Iteration: 1540, Train loss: 0.0157, rewards: 0.8669\n",
      "Iteration: 1560, Train loss: -0.0031, rewards: 0.8785\n",
      "Iteration: 1580, Train loss: -0.0034, rewards: 0.8601\n",
      "Iteration: 1600, Train loss: 0.0104, rewards: 0.8846\n",
      "Eval:\n",
      "Hits@1: 0.8507, Hits@3: 0.8756, Hits@10: 0.9005, MRR: 0.8670\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: 0.0058, rewards: 0.8582\n",
      "Iteration: 1640, Train loss: 0.0259, rewards: 0.8507\n",
      "Iteration: 1660, Train loss: 0.0036, rewards: 0.8712\n",
      "Iteration: 1680, Train loss: 0.0031, rewards: 0.8748\n",
      "Iteration: 1700, Train loss: 0.0074, rewards: 0.8856\n",
      "Iteration: 1720, Train loss: 0.0011, rewards: 0.8592\n",
      "Iteration: 1740, Train loss: 0.0051, rewards: 0.8656\n",
      "Iteration: 1760, Train loss: 0.0226, rewards: 0.8589\n",
      "Iteration: 1780, Train loss: 0.0175, rewards: 0.8729\n",
      "Iteration: 1800, Train loss: -0.0030, rewards: 0.8649\n",
      "Eval:\n",
      "Hits@1: 0.8507, Hits@3: 0.8806, Hits@10: 0.9005, MRR: 0.8679\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: 0.0327, rewards: 0.8771\n",
      "Iteration: 1840, Train loss: 0.0065, rewards: 0.8599\n",
      "Iteration: 1860, Train loss: -0.0058, rewards: 0.8676\n",
      "Iteration: 1880, Train loss: -0.0003, rewards: 0.8836\n",
      "Iteration: 1900, Train loss: 0.0121, rewards: 0.8791\n",
      "Iteration: 1920, Train loss: -0.0100, rewards: 0.8700\n",
      "Iteration: 1940, Train loss: 0.0263, rewards: 0.8668\n",
      "Iteration: 1960, Train loss: 0.0026, rewards: 0.8638\n",
      "Iteration: 1980, Train loss: 0.0140, rewards: 0.8578\n",
      "Iteration: 2000, Train loss: 0.0218, rewards: 0.8684\n",
      "Eval:\n",
      "Hits@1: 0.8010, Hits@3: 0.8756, Hits@10: 0.8856, MRR: 0.8417\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/athletehomestadium//test_beam/ ]\n",
      "Hits@1: 0.8209, Hits@3: 0.8706, Hits@10: 0.8905, MRR: 0.8480\n",
      "MINERVA MAP: 0.9133484812589291 (201 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.0884, rewards: 0.6240\n",
      "Iteration: 40, Train loss: 0.0086, rewards: 0.6863\n",
      "Iteration: 60, Train loss: 0.0281, rewards: 0.7041\n",
      "Iteration: 80, Train loss: 0.0301, rewards: 0.7121\n",
      "Iteration: 100, Train loss: -0.0082, rewards: 0.7183\n",
      "Iteration: 120, Train loss: -0.0081, rewards: 0.7418\n",
      "Iteration: 140, Train loss: -0.0038, rewards: 0.7571\n",
      "Iteration: 160, Train loss: -0.0059, rewards: 0.7158\n",
      "Iteration: 180, Train loss: -0.0067, rewards: 0.7486\n",
      "Iteration: 200, Train loss: -0.0016, rewards: 0.7434\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.8351, Hits@10: 0.8454, MRR: 0.8050\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: 0.0078, rewards: 0.7464\n",
      "Iteration: 240, Train loss: -0.0289, rewards: 0.7479\n",
      "Iteration: 260, Train loss: 0.0021, rewards: 0.7596\n",
      "Iteration: 280, Train loss: -0.0082, rewards: 0.7698\n",
      "Iteration: 300, Train loss: -0.0828, rewards: 0.8014\n",
      "Iteration: 320, Train loss: -0.0459, rewards: 0.8121\n",
      "Iteration: 340, Train loss: -0.0316, rewards: 0.7938\n",
      "Iteration: 360, Train loss: -0.0308, rewards: 0.8209\n",
      "Iteration: 380, Train loss: -0.0440, rewards: 0.8027\n",
      "Iteration: 400, Train loss: -0.0873, rewards: 0.8118\n",
      "Eval:\n",
      "Hits@1: 0.8454, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8505\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.0433, rewards: 0.8181\n",
      "Iteration: 440, Train loss: -0.0469, rewards: 0.8135\n",
      "Iteration: 460, Train loss: -0.0131, rewards: 0.8198\n",
      "Iteration: 480, Train loss: -0.0642, rewards: 0.8033\n",
      "Iteration: 500, Train loss: -0.0852, rewards: 0.8237\n",
      "Iteration: 520, Train loss: -0.0667, rewards: 0.8196\n",
      "Iteration: 540, Train loss: -0.0680, rewards: 0.8226\n",
      "Iteration: 560, Train loss: -0.0355, rewards: 0.8041\n",
      "Iteration: 580, Train loss: -0.0989, rewards: 0.8368\n",
      "Iteration: 600, Train loss: -0.0559, rewards: 0.8151\n",
      "Eval:\n",
      "Hits@1: 0.8247, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8402\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.0826, rewards: 0.8281\n",
      "Iteration: 640, Train loss: -0.0885, rewards: 0.8223\n",
      "Iteration: 660, Train loss: -0.0310, rewards: 0.8248\n",
      "Iteration: 680, Train loss: -0.1241, rewards: 0.8159\n",
      "Iteration: 700, Train loss: -0.0775, rewards: 0.8153\n",
      "Iteration: 720, Train loss: -0.0846, rewards: 0.8265\n",
      "Iteration: 740, Train loss: -0.1017, rewards: 0.8190\n",
      "Iteration: 760, Train loss: -0.0896, rewards: 0.8224\n",
      "Iteration: 780, Train loss: -0.1000, rewards: 0.8169\n",
      "Iteration: 800, Train loss: -0.0984, rewards: 0.8060\n",
      "Eval:\n",
      "Hits@1: 0.8351, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8454\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.0813, rewards: 0.8205\n",
      "Iteration: 840, Train loss: -0.1043, rewards: 0.8382\n",
      "Iteration: 860, Train loss: -0.0564, rewards: 0.8201\n",
      "Iteration: 880, Train loss: -0.0529, rewards: 0.8211\n",
      "Iteration: 900, Train loss: -0.0751, rewards: 0.8336\n",
      "Iteration: 920, Train loss: -0.0553, rewards: 0.8384\n",
      "Iteration: 940, Train loss: -0.0589, rewards: 0.8283\n",
      "Iteration: 960, Train loss: -0.0516, rewards: 0.8278\n",
      "Iteration: 980, Train loss: -0.0561, rewards: 0.8413\n",
      "Iteration: 1000, Train loss: -0.0767, rewards: 0.8215\n",
      "Eval:\n",
      "Hits@1: 0.8041, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8299\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.0247, rewards: 0.8322\n",
      "Iteration: 1040, Train loss: -0.0241, rewards: 0.8316\n",
      "Iteration: 1060, Train loss: -0.0038, rewards: 0.8239\n",
      "Iteration: 1080, Train loss: -0.0078, rewards: 0.8405\n",
      "Iteration: 1100, Train loss: -0.0652, rewards: 0.8552\n",
      "Iteration: 1120, Train loss: -0.0881, rewards: 0.8280\n",
      "Iteration: 1140, Train loss: -0.0983, rewards: 0.8345\n",
      "Iteration: 1160, Train loss: -0.1108, rewards: 0.8323\n",
      "Iteration: 1180, Train loss: -0.1268, rewards: 0.8343\n",
      "Iteration: 1200, Train loss: -0.1118, rewards: 0.8246\n",
      "Eval:\n",
      "Hits@1: 0.8041, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8299\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.0613, rewards: 0.8396\n",
      "Iteration: 1240, Train loss: -0.1127, rewards: 0.8355\n",
      "Iteration: 1260, Train loss: -0.0573, rewards: 0.8362\n",
      "Iteration: 1280, Train loss: -0.0946, rewards: 0.8102\n",
      "Iteration: 1300, Train loss: -0.0786, rewards: 0.8252\n",
      "Iteration: 1320, Train loss: -0.1189, rewards: 0.8161\n",
      "Iteration: 1340, Train loss: -0.1404, rewards: 0.8196\n",
      "Iteration: 1360, Train loss: -0.1202, rewards: 0.8237\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1380, Train loss: -0.0673, rewards: 0.8404\n",
      "Iteration: 1400, Train loss: -0.0277, rewards: 0.8354\n",
      "Eval:\n",
      "Hits@1: 0.7938, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8230\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.0679, rewards: 0.8284\n",
      "Iteration: 1440, Train loss: -0.0490, rewards: 0.8165\n",
      "Iteration: 1460, Train loss: -0.0244, rewards: 0.8303\n",
      "Iteration: 1480, Train loss: -0.0860, rewards: 0.8359\n",
      "Iteration: 1500, Train loss: -0.1223, rewards: 0.8452\n",
      "Iteration: 1520, Train loss: -0.0336, rewards: 0.8421\n",
      "Iteration: 1540, Train loss: -0.0733, rewards: 0.8334\n",
      "Iteration: 1560, Train loss: -0.1014, rewards: 0.8349\n",
      "Iteration: 1580, Train loss: -0.0791, rewards: 0.8389\n",
      "Iteration: 1600, Train loss: -0.1219, rewards: 0.8489\n",
      "Eval:\n",
      "Hits@1: 0.8041, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8299\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.1154, rewards: 0.8282\n",
      "Iteration: 1640, Train loss: -0.1484, rewards: 0.8412\n",
      "Iteration: 1660, Train loss: -0.1146, rewards: 0.8396\n",
      "Iteration: 1680, Train loss: -0.1327, rewards: 0.8338\n",
      "Iteration: 1700, Train loss: -0.1271, rewards: 0.8242\n",
      "Iteration: 1720, Train loss: -0.1184, rewards: 0.8043\n",
      "Iteration: 1740, Train loss: -0.1188, rewards: 0.8349\n",
      "Iteration: 1760, Train loss: -0.1535, rewards: 0.8387\n",
      "Iteration: 1780, Train loss: -0.1910, rewards: 0.8201\n",
      "Iteration: 1800, Train loss: -0.1702, rewards: 0.8094\n",
      "Eval:\n",
      "Hits@1: 0.7938, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8247\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.1303, rewards: 0.8134\n",
      "Iteration: 1840, Train loss: -0.1577, rewards: 0.8261\n",
      "Iteration: 1860, Train loss: -0.0975, rewards: 0.8292\n",
      "Iteration: 1880, Train loss: -0.1500, rewards: 0.8357\n",
      "Iteration: 1900, Train loss: -0.0760, rewards: 0.8199\n",
      "Iteration: 1920, Train loss: -0.1522, rewards: 0.8090\n",
      "Iteration: 1940, Train loss: -0.1380, rewards: 0.8362\n",
      "Iteration: 1960, Train loss: -0.1293, rewards: 0.8425\n",
      "Iteration: 1980, Train loss: -0.1043, rewards: 0.8448\n",
      "Iteration: 2000, Train loss: -0.1470, rewards: 0.8524\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.8557, Hits@10: 0.8557, MRR: 0.8076\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.6696, Hits@3: 0.7679, Hits@10: 0.8125, MRR: 0.7272\n",
      "MINERVA MAP: 0.8701105442176871 (112 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: 0.4952, rewards: 0.5223\n",
      "Iteration: 40, Train loss: 0.5170, rewards: 0.5142\n",
      "Iteration: 60, Train loss: 0.5276, rewards: 0.5227\n",
      "Iteration: 80, Train loss: 0.5048, rewards: 0.5380\n",
      "Iteration: 100, Train loss: 0.5447, rewards: 0.5219\n",
      "Iteration: 120, Train loss: 0.5472, rewards: 0.5199\n",
      "Iteration: 140, Train loss: 0.5349, rewards: 0.5610\n",
      "Iteration: 160, Train loss: 0.5495, rewards: 0.5173\n",
      "Iteration: 180, Train loss: 0.5600, rewards: 0.5434\n",
      "Iteration: 200, Train loss: 0.5666, rewards: 0.5365\n",
      "Eval:\n",
      "Hits@1: 0.5188, Hits@3: 0.5325, Hits@10: 0.5445, MRR: 0.5283\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: 0.5506, rewards: 0.5536\n",
      "Iteration: 240, Train loss: 0.5565, rewards: 0.5260\n",
      "Iteration: 260, Train loss: 0.5488, rewards: 0.5307\n",
      "Iteration: 280, Train loss: 0.5510, rewards: 0.5398\n",
      "Iteration: 300, Train loss: 0.5600, rewards: 0.5418\n",
      "Iteration: 320, Train loss: 0.5604, rewards: 0.5041\n",
      "Iteration: 340, Train loss: 0.5767, rewards: 0.5243\n",
      "Iteration: 360, Train loss: 0.5575, rewards: 0.5500\n",
      "Iteration: 380, Train loss: 0.5907, rewards: 0.5208\n",
      "Iteration: 400, Train loss: 0.5756, rewards: 0.5047\n",
      "Eval:\n",
      "Hits@1: 0.5188, Hits@3: 0.5325, Hits@10: 0.5428, MRR: 0.5266\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: 0.5754, rewards: 0.4982\n",
      "Iteration: 440, Train loss: 0.5645, rewards: 0.5346\n",
      "Iteration: 460, Train loss: 0.5740, rewards: 0.5143\n",
      "Iteration: 480, Train loss: 0.5580, rewards: 0.5268\n",
      "Iteration: 500, Train loss: 0.5579, rewards: 0.5356\n",
      "Iteration: 520, Train loss: 0.5675, rewards: 0.5317\n",
      "Iteration: 540, Train loss: 0.5822, rewards: 0.5332\n",
      "Iteration: 560, Train loss: 0.5725, rewards: 0.5318\n",
      "Iteration: 580, Train loss: 0.5809, rewards: 0.5195\n",
      "Iteration: 600, Train loss: 0.5748, rewards: 0.5256\n",
      "Eval:\n",
      "Hits@1: 0.5188, Hits@3: 0.5325, Hits@10: 0.5428, MRR: 0.5276\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: 0.5897, rewards: 0.5051\n",
      "Iteration: 640, Train loss: 0.5764, rewards: 0.5073\n",
      "Iteration: 660, Train loss: 0.5958, rewards: 0.5029\n",
      "Iteration: 680, Train loss: 0.5908, rewards: 0.5337\n",
      "Iteration: 700, Train loss: 0.5952, rewards: 0.4995\n",
      "Iteration: 720, Train loss: 0.6038, rewards: 0.5134\n",
      "Iteration: 740, Train loss: 0.5855, rewards: 0.5168\n",
      "Iteration: 760, Train loss: 0.6035, rewards: 0.5142\n",
      "Iteration: 780, Train loss: 0.5800, rewards: 0.5324\n",
      "Iteration: 800, Train loss: 0.5896, rewards: 0.5168\n",
      "Eval:\n",
      "Hits@1: 0.5188, Hits@3: 0.5360, Hits@10: 0.5428, MRR: 0.5278\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: 0.5926, rewards: 0.5162\n",
      "Iteration: 840, Train loss: 0.5861, rewards: 0.5377\n",
      "Iteration: 860, Train loss: 0.5746, rewards: 0.5289\n",
      "Iteration: 880, Train loss: 0.5752, rewards: 0.5516\n",
      "Iteration: 900, Train loss: 0.5816, rewards: 0.5346\n",
      "Iteration: 920, Train loss: 0.5863, rewards: 0.5055\n",
      "Iteration: 940, Train loss: 0.5732, rewards: 0.5034\n",
      "Iteration: 960, Train loss: 0.5893, rewards: 0.5198\n",
      "Iteration: 980, Train loss: 0.5862, rewards: 0.5268\n",
      "Iteration: 1000, Train loss: 0.5953, rewards: 0.5234\n",
      "Eval:\n",
      "Hits@1: 0.5240, Hits@3: 0.5308, Hits@10: 0.5428, MRR: 0.5295\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: 0.5891, rewards: 0.5100\n",
      "Iteration: 1040, Train loss: 0.5878, rewards: 0.5557\n",
      "Iteration: 1060, Train loss: 0.5743, rewards: 0.5715\n",
      "Iteration: 1080, Train loss: 0.5947, rewards: 0.5212\n",
      "Iteration: 1100, Train loss: 0.5856, rewards: 0.5223\n",
      "Iteration: 1120, Train loss: 0.5741, rewards: 0.5148\n",
      "Iteration: 1140, Train loss: 0.5962, rewards: 0.5136\n",
      "Iteration: 1160, Train loss: 0.5761, rewards: 0.5277\n",
      "Iteration: 1180, Train loss: 0.5517, rewards: 0.5342\n",
      "Iteration: 1200, Train loss: 0.5863, rewards: 0.5142\n",
      "Eval:\n",
      "Hits@1: 0.5120, Hits@3: 0.5325, Hits@10: 0.5360, MRR: 0.5225\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: 0.5701, rewards: 0.4979\n",
      "Iteration: 1240, Train loss: 0.5663, rewards: 0.5310\n",
      "Iteration: 1260, Train loss: 0.5700, rewards: 0.5364\n",
      "Iteration: 1280, Train loss: 0.5779, rewards: 0.5232\n",
      "Iteration: 1300, Train loss: 0.5838, rewards: 0.5144\n",
      "Iteration: 1320, Train loss: 0.5489, rewards: 0.5355\n",
      "Iteration: 1340, Train loss: 0.5662, rewards: 0.5323\n",
      "Iteration: 1360, Train loss: 0.5547, rewards: 0.5407\n",
      "Iteration: 1380, Train loss: 0.5648, rewards: 0.5139\n",
      "Iteration: 1400, Train loss: 0.5726, rewards: 0.5316\n",
      "Eval:\n",
      "Hits@1: 0.5137, Hits@3: 0.5308, Hits@10: 0.5428, MRR: 0.5247\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: 0.5594, rewards: 0.5491\n",
      "Iteration: 1440, Train loss: 0.5570, rewards: 0.5388\n",
      "Iteration: 1460, Train loss: 0.5486, rewards: 0.5429\n",
      "Iteration: 1480, Train loss: 0.5403, rewards: 0.5455\n",
      "Iteration: 1500, Train loss: 0.5529, rewards: 0.5598\n",
      "Iteration: 1520, Train loss: 0.5720, rewards: 0.5340\n",
      "Iteration: 1540, Train loss: 0.5573, rewards: 0.5247\n",
      "Iteration: 1560, Train loss: 0.5856, rewards: 0.5175\n",
      "Iteration: 1580, Train loss: 0.5731, rewards: 0.5287\n",
      "Iteration: 1600, Train loss: 0.5663, rewards: 0.5127\n",
      "Eval:\n",
      "Hits@1: 0.4692, Hits@3: 0.5325, Hits@10: 0.5394, MRR: 0.5022\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: 0.5504, rewards: 0.5326\n",
      "Iteration: 1640, Train loss: 0.5271, rewards: 0.5298\n",
      "Iteration: 1660, Train loss: 0.5524, rewards: 0.5169\n",
      "Iteration: 1680, Train loss: 0.5493, rewards: 0.5503\n",
      "Iteration: 1700, Train loss: 0.5655, rewards: 0.5300\n",
      "Iteration: 1720, Train loss: 0.5488, rewards: 0.5614\n",
      "Iteration: 1740, Train loss: 0.5592, rewards: 0.5380\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1760, Train loss: 0.5606, rewards: 0.4969\n",
      "Iteration: 1780, Train loss: 0.5758, rewards: 0.5165\n",
      "Iteration: 1800, Train loss: 0.5647, rewards: 0.5267\n",
      "Eval:\n",
      "Hits@1: 0.4007, Hits@3: 0.5342, Hits@10: 0.5428, MRR: 0.4682\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: 0.5750, rewards: 0.5202\n",
      "Iteration: 1840, Train loss: 0.5459, rewards: 0.5321\n",
      "Iteration: 1860, Train loss: 0.5412, rewards: 0.5293\n",
      "Iteration: 1880, Train loss: 0.5575, rewards: 0.5211\n",
      "Iteration: 1900, Train loss: 0.5392, rewards: 0.5103\n",
      "Iteration: 1920, Train loss: 0.5103, rewards: 0.5395\n",
      "Iteration: 1940, Train loss: 0.5517, rewards: 0.5266\n",
      "Iteration: 1960, Train loss: 0.5416, rewards: 0.5327\n",
      "Iteration: 1980, Train loss: 0.5500, rewards: 0.5209\n",
      "Iteration: 2000, Train loss: 0.5303, rewards: 0.5487\n",
      "Eval:\n",
      "Hits@1: 0.3921, Hits@3: 0.5342, Hits@10: 0.5428, MRR: 0.4646\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/athleteplayssport//test_beam/ ]\n",
      "Hits@1: 0.4096, Hits@3: 0.4710, Hits@10: 0.4793, MRR: 0.4392\n",
      "MINERVA MAP: 0.9709508015478165 (603 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.5134, rewards: 0.4173\n",
      "Iteration: 40, Train loss: -0.5470, rewards: 0.4562\n",
      "Iteration: 60, Train loss: -0.4967, rewards: 0.4662\n",
      "Iteration: 80, Train loss: -0.5192, rewards: 0.4646\n",
      "Iteration: 100, Train loss: -0.5765, rewards: 0.4752\n",
      "Iteration: 120, Train loss: -0.5618, rewards: 0.4791\n",
      "Iteration: 140, Train loss: -0.5671, rewards: 0.4689\n",
      "Iteration: 160, Train loss: -0.6258, rewards: 0.4997\n",
      "Iteration: 180, Train loss: -0.6990, rewards: 0.4799\n",
      "Iteration: 200, Train loss: -0.6369, rewards: 0.5176\n",
      "Eval:\n",
      "Hits@1: 0.5273, Hits@3: 0.5441, Hits@10: 0.5735, MRR: 0.5390\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.6624, rewards: 0.5234\n",
      "Iteration: 240, Train loss: -0.6958, rewards: 0.5112\n",
      "Iteration: 260, Train loss: -0.6839, rewards: 0.5173\n",
      "Iteration: 280, Train loss: -0.5987, rewards: 0.5184\n",
      "Iteration: 300, Train loss: -0.6692, rewards: 0.5282\n",
      "Iteration: 320, Train loss: -0.7030, rewards: 0.5103\n",
      "Iteration: 340, Train loss: -0.7117, rewards: 0.5028\n",
      "Iteration: 360, Train loss: -0.7471, rewards: 0.5223\n",
      "Iteration: 380, Train loss: -0.7434, rewards: 0.5210\n",
      "Iteration: 400, Train loss: -0.7353, rewards: 0.4829\n",
      "Eval:\n",
      "Hits@1: 0.5294, Hits@3: 0.5399, Hits@10: 0.5609, MRR: 0.5379\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.7148, rewards: 0.5202\n",
      "Iteration: 440, Train loss: -0.7052, rewards: 0.5175\n",
      "Iteration: 460, Train loss: -0.7359, rewards: 0.5266\n",
      "Iteration: 480, Train loss: -0.8345, rewards: 0.5014\n",
      "Iteration: 500, Train loss: -0.8159, rewards: 0.5214\n",
      "Iteration: 520, Train loss: -0.7792, rewards: 0.4989\n",
      "Iteration: 540, Train loss: -0.7625, rewards: 0.5033\n",
      "Iteration: 560, Train loss: -0.7714, rewards: 0.5161\n",
      "Iteration: 580, Train loss: -0.7515, rewards: 0.5145\n",
      "Iteration: 600, Train loss: -0.7921, rewards: 0.5078\n",
      "Eval:\n",
      "Hits@1: 0.5315, Hits@3: 0.5420, Hits@10: 0.5651, MRR: 0.5409\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.7540, rewards: 0.5213\n",
      "Iteration: 640, Train loss: -0.7674, rewards: 0.5150\n",
      "Iteration: 660, Train loss: -0.7906, rewards: 0.5211\n",
      "Iteration: 680, Train loss: -0.7959, rewards: 0.4962\n",
      "Iteration: 700, Train loss: -0.7738, rewards: 0.5246\n",
      "Iteration: 720, Train loss: -0.7768, rewards: 0.5107\n",
      "Iteration: 740, Train loss: -0.7660, rewards: 0.5184\n",
      "Iteration: 760, Train loss: -0.7254, rewards: 0.5551\n",
      "Iteration: 780, Train loss: -0.8139, rewards: 0.5001\n",
      "Iteration: 800, Train loss: -0.7666, rewards: 0.5184\n",
      "Eval:\n",
      "Hits@1: 0.5357, Hits@3: 0.5420, Hits@10: 0.5651, MRR: 0.5430\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.7921, rewards: 0.5265\n",
      "Iteration: 840, Train loss: -0.7436, rewards: 0.5191\n",
      "Iteration: 860, Train loss: -0.7583, rewards: 0.5294\n",
      "Iteration: 880, Train loss: -0.7895, rewards: 0.5368\n",
      "Iteration: 900, Train loss: -0.8006, rewards: 0.5091\n",
      "Iteration: 920, Train loss: -0.7772, rewards: 0.5194\n",
      "Iteration: 940, Train loss: -0.8013, rewards: 0.5043\n",
      "Iteration: 960, Train loss: -0.8019, rewards: 0.5290\n",
      "Iteration: 980, Train loss: -0.7439, rewards: 0.5264\n",
      "Iteration: 1000, Train loss: -0.7442, rewards: 0.5454\n",
      "Eval:\n",
      "Hits@1: 0.5252, Hits@3: 0.5483, Hits@10: 0.5672, MRR: 0.5383\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.7585, rewards: 0.5229\n",
      "Iteration: 1040, Train loss: -0.7862, rewards: 0.5266\n",
      "Iteration: 1060, Train loss: -0.8050, rewards: 0.5403\n",
      "Iteration: 1080, Train loss: -0.7441, rewards: 0.5026\n",
      "Iteration: 1100, Train loss: -0.7641, rewards: 0.5293\n",
      "Iteration: 1120, Train loss: -0.7493, rewards: 0.5495\n",
      "Iteration: 1140, Train loss: -0.7699, rewards: 0.5372\n",
      "Iteration: 1160, Train loss: -0.7338, rewards: 0.5244\n",
      "Iteration: 1180, Train loss: -0.7394, rewards: 0.5320\n",
      "Iteration: 1200, Train loss: -0.7942, rewards: 0.5251\n",
      "Eval:\n",
      "Hits@1: 0.5126, Hits@3: 0.5462, Hits@10: 0.5630, MRR: 0.5303\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.7255, rewards: 0.5365\n",
      "Iteration: 1240, Train loss: -0.7801, rewards: 0.5141\n",
      "Iteration: 1260, Train loss: -0.7658, rewards: 0.5231\n",
      "Iteration: 1280, Train loss: -0.7723, rewards: 0.5266\n",
      "Iteration: 1300, Train loss: -0.7549, rewards: 0.5323\n",
      "Iteration: 1320, Train loss: -0.7812, rewards: 0.5415\n",
      "Iteration: 1340, Train loss: -0.7479, rewards: 0.5050\n",
      "Iteration: 1360, Train loss: -0.7296, rewards: 0.5340\n",
      "Iteration: 1380, Train loss: -0.7593, rewards: 0.5153\n",
      "Iteration: 1400, Train loss: -0.7529, rewards: 0.5155\n",
      "Eval:\n",
      "Hits@1: 0.5147, Hits@3: 0.5462, Hits@10: 0.5588, MRR: 0.5316\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.7557, rewards: 0.5264\n",
      "Iteration: 1440, Train loss: -0.7657, rewards: 0.5423\n",
      "Iteration: 1460, Train loss: -0.8102, rewards: 0.5257\n",
      "Iteration: 1480, Train loss: -0.7469, rewards: 0.5196\n",
      "Iteration: 1500, Train loss: -0.6966, rewards: 0.5289\n",
      "Iteration: 1520, Train loss: -0.7396, rewards: 0.5202\n",
      "Iteration: 1540, Train loss: -0.7689, rewards: 0.5236\n",
      "Iteration: 1560, Train loss: -0.7626, rewards: 0.5170\n",
      "Iteration: 1580, Train loss: -0.7803, rewards: 0.5188\n",
      "Iteration: 1600, Train loss: -0.7732, rewards: 0.5268\n",
      "Eval:\n",
      "Hits@1: 0.5336, Hits@3: 0.5483, Hits@10: 0.5672, MRR: 0.5435\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.8244, rewards: 0.5373\n",
      "Iteration: 1640, Train loss: -0.7571, rewards: 0.5213\n",
      "Iteration: 1660, Train loss: -0.7794, rewards: 0.5039\n",
      "Iteration: 1680, Train loss: -0.7507, rewards: 0.5108\n",
      "Iteration: 1700, Train loss: -0.7481, rewards: 0.5123\n",
      "Iteration: 1720, Train loss: -0.7661, rewards: 0.5359\n",
      "Iteration: 1740, Train loss: -0.8124, rewards: 0.5230\n",
      "Iteration: 1760, Train loss: -0.7838, rewards: 0.5338\n",
      "Iteration: 1780, Train loss: -0.7907, rewards: 0.5311\n",
      "Iteration: 1800, Train loss: -0.7891, rewards: 0.5204\n",
      "Eval:\n",
      "Hits@1: 0.5378, Hits@3: 0.5483, Hits@10: 0.5651, MRR: 0.5450\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.7674, rewards: 0.5302\n",
      "Iteration: 1840, Train loss: -0.7375, rewards: 0.5339\n",
      "Iteration: 1860, Train loss: -0.8375, rewards: 0.5119\n",
      "Iteration: 1880, Train loss: -0.7875, rewards: 0.5186\n",
      "Iteration: 1900, Train loss: -0.7653, rewards: 0.5504\n",
      "Iteration: 1920, Train loss: -0.7767, rewards: 0.5523\n",
      "Iteration: 1940, Train loss: -0.7759, rewards: 0.5246\n",
      "Iteration: 1960, Train loss: -0.8138, rewards: 0.5020\n",
      "Iteration: 1980, Train loss: -0.7807, rewards: 0.5507\n",
      "Iteration: 2000, Train loss: -0.7737, rewards: 0.5333\n",
      "Eval:\n",
      "Hits@1: 0.5273, Hits@3: 0.5399, Hits@10: 0.5588, MRR: 0.5366\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/organizationhiredperson//test_beam/ ]\n",
      "Hits@1: 0.4588, Hits@3: 0.5412, Hits@10: 0.5741, MRR: 0.5045\n",
      "MINERVA MAP: 0.8538014972190072 (349 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.0009, rewards: 0.5716\n",
      "Iteration: 40, Train loss: 0.0353, rewards: 0.6111\n",
      "Iteration: 60, Train loss: 0.0297, rewards: 0.6183\n",
      "Iteration: 80, Train loss: -0.0334, rewards: 0.6069\n",
      "Iteration: 100, Train loss: -0.0528, rewards: 0.6209\n",
      "Iteration: 120, Train loss: 0.0183, rewards: 0.6021\n",
      "Iteration: 140, Train loss: -0.0364, rewards: 0.6375\n",
      "Iteration: 160, Train loss: -0.0404, rewards: 0.6366\n",
      "Iteration: 180, Train loss: -0.0369, rewards: 0.6533\n",
      "Iteration: 200, Train loss: -0.0547, rewards: 0.6422\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6436, Hits@10: 0.6543, MRR: 0.6285\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.0187, rewards: 0.6786\n",
      "Iteration: 240, Train loss: -0.0153, rewards: 0.6518\n",
      "Iteration: 260, Train loss: -0.0078, rewards: 0.6829\n",
      "Iteration: 280, Train loss: -0.0435, rewards: 0.6743\n",
      "Iteration: 300, Train loss: -0.0332, rewards: 0.6800\n",
      "Iteration: 320, Train loss: -0.0149, rewards: 0.6960\n",
      "Iteration: 340, Train loss: -0.0200, rewards: 0.6905\n",
      "Iteration: 360, Train loss: 0.0170, rewards: 0.6921\n",
      "Iteration: 380, Train loss: -0.0254, rewards: 0.6679\n",
      "Iteration: 400, Train loss: -0.0561, rewards: 0.6668\n",
      "Eval:\n",
      "Hits@1: 0.6277, Hits@3: 0.6436, Hits@10: 0.6543, MRR: 0.6383\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.0426, rewards: 0.6867\n",
      "Iteration: 440, Train loss: -0.0096, rewards: 0.6745\n",
      "Iteration: 460, Train loss: 0.0069, rewards: 0.6691\n",
      "Iteration: 480, Train loss: -0.0046, rewards: 0.6749\n",
      "Iteration: 500, Train loss: -0.0397, rewards: 0.7083\n",
      "Iteration: 520, Train loss: -0.0541, rewards: 0.7200\n",
      "Iteration: 540, Train loss: 0.0582, rewards: 0.7841\n",
      "Iteration: 560, Train loss: 0.1240, rewards: 0.7709\n",
      "Iteration: 580, Train loss: 0.0923, rewards: 0.7908\n",
      "Iteration: 600, Train loss: 0.0716, rewards: 0.8058\n",
      "Eval:\n",
      "Hits@1: 0.7606, Hits@3: 0.7766, Hits@10: 0.7766, MRR: 0.7690\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: 0.0954, rewards: 0.7900\n",
      "Iteration: 640, Train loss: 0.0811, rewards: 0.7889\n",
      "Iteration: 660, Train loss: 0.0829, rewards: 0.7945\n",
      "Iteration: 680, Train loss: 0.1057, rewards: 0.8034\n",
      "Iteration: 700, Train loss: 0.0666, rewards: 0.7979\n",
      "Iteration: 720, Train loss: 0.0912, rewards: 0.7704\n",
      "Iteration: 740, Train loss: 0.1071, rewards: 0.7842\n",
      "Iteration: 760, Train loss: 0.1173, rewards: 0.7639\n",
      "Iteration: 780, Train loss: 0.0877, rewards: 0.7993\n",
      "Iteration: 800, Train loss: 0.1036, rewards: 0.7784\n",
      "Eval:\n",
      "Hits@1: 0.7713, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7757\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: 0.0460, rewards: 0.7973\n",
      "Iteration: 840, Train loss: 0.0835, rewards: 0.8092\n",
      "Iteration: 860, Train loss: 0.1004, rewards: 0.8039\n",
      "Iteration: 880, Train loss: 0.1108, rewards: 0.8125\n",
      "Iteration: 900, Train loss: 0.0815, rewards: 0.8123\n",
      "Iteration: 920, Train loss: 0.1222, rewards: 0.8169\n",
      "Iteration: 940, Train loss: 0.0861, rewards: 0.8071\n",
      "Iteration: 960, Train loss: 0.1093, rewards: 0.8023\n",
      "Iteration: 980, Train loss: 0.0492, rewards: 0.7958\n",
      "Iteration: 1000, Train loss: 0.0961, rewards: 0.8291\n",
      "Eval:\n",
      "Hits@1: 0.7766, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7793\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: 0.1012, rewards: 0.8134\n",
      "Iteration: 1040, Train loss: 0.0650, rewards: 0.7861\n",
      "Iteration: 1060, Train loss: 0.0686, rewards: 0.8010\n",
      "Iteration: 1080, Train loss: 0.1033, rewards: 0.7987\n",
      "Iteration: 1100, Train loss: 0.1275, rewards: 0.8021\n",
      "Iteration: 1120, Train loss: 0.0683, rewards: 0.8024\n",
      "Iteration: 1140, Train loss: 0.1059, rewards: 0.8074\n",
      "Iteration: 1160, Train loss: 0.1126, rewards: 0.7936\n",
      "Iteration: 1180, Train loss: 0.1208, rewards: 0.7810\n",
      "Iteration: 1200, Train loss: 0.1220, rewards: 0.7975\n",
      "Eval:\n",
      "Hits@1: 0.7766, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7793\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: 0.0811, rewards: 0.8193\n",
      "Iteration: 1240, Train loss: 0.0805, rewards: 0.8032\n",
      "Iteration: 1260, Train loss: 0.1508, rewards: 0.8057\n",
      "Iteration: 1280, Train loss: 0.0310, rewards: 0.8114\n",
      "Iteration: 1300, Train loss: 0.0997, rewards: 0.8088\n",
      "Iteration: 1320, Train loss: 0.1000, rewards: 0.7988\n",
      "Iteration: 1340, Train loss: 0.1145, rewards: 0.7879\n",
      "Iteration: 1360, Train loss: 0.1232, rewards: 0.7953\n",
      "Iteration: 1380, Train loss: 0.0993, rewards: 0.7991\n",
      "Iteration: 1400, Train loss: 0.0799, rewards: 0.7789\n",
      "Eval:\n",
      "Hits@1: 0.7660, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7739\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: 0.0762, rewards: 0.7951\n",
      "Iteration: 1440, Train loss: 0.1119, rewards: 0.7995\n",
      "Iteration: 1460, Train loss: 0.1101, rewards: 0.8082\n",
      "Iteration: 1480, Train loss: 0.0481, rewards: 0.8146\n",
      "Iteration: 1500, Train loss: 0.0935, rewards: 0.7883\n",
      "Iteration: 1520, Train loss: 0.0698, rewards: 0.8139\n",
      "Iteration: 1540, Train loss: 0.0628, rewards: 0.7998\n",
      "Iteration: 1560, Train loss: 0.0808, rewards: 0.8114\n",
      "Iteration: 1580, Train loss: 0.0634, rewards: 0.8192\n",
      "Iteration: 1600, Train loss: 0.0717, rewards: 0.8066\n",
      "Eval:\n",
      "Hits@1: 0.7713, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7766\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: 0.1065, rewards: 0.8026\n",
      "Iteration: 1640, Train loss: 0.0744, rewards: 0.8101\n",
      "Iteration: 1660, Train loss: 0.1099, rewards: 0.7992\n",
      "Iteration: 1680, Train loss: 0.1083, rewards: 0.7945\n",
      "Iteration: 1700, Train loss: 0.0442, rewards: 0.8091\n",
      "Iteration: 1720, Train loss: 0.1083, rewards: 0.8010\n",
      "Iteration: 1740, Train loss: 0.0818, rewards: 0.7896\n",
      "Iteration: 1760, Train loss: 0.0552, rewards: 0.7999\n",
      "Iteration: 1780, Train loss: 0.0509, rewards: 0.8027\n",
      "Iteration: 1800, Train loss: 0.1116, rewards: 0.7943\n",
      "Eval:\n",
      "Hits@1: 0.7660, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7739\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: 0.0363, rewards: 0.8080\n",
      "Iteration: 1840, Train loss: 0.0258, rewards: 0.8100\n",
      "Iteration: 1860, Train loss: 0.0665, rewards: 0.8209\n",
      "Iteration: 1880, Train loss: 0.0425, rewards: 0.7969\n",
      "Iteration: 1900, Train loss: 0.0485, rewards: 0.7963\n",
      "Iteration: 1920, Train loss: 0.0342, rewards: 0.8104\n",
      "Iteration: 1940, Train loss: 0.0716, rewards: 0.8209\n",
      "Iteration: 1960, Train loss: 0.1008, rewards: 0.7979\n",
      "Iteration: 1980, Train loss: 0.0603, rewards: 0.7933\n",
      "Iteration: 2000, Train loss: 0.0835, rewards: 0.7858\n",
      "Eval:\n",
      "Hits@1: 0.7766, Hits@3: 0.7819, Hits@10: 0.7819, MRR: 0.7793\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/personborninlocation//test_beam/ ]\n",
      "Hits@1: 0.5389, Hits@3: 0.6736, Hits@10: 0.7202, MRR: 0.6108\n",
      "MINERVA MAP: 0.7679664894690801 (193 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.1797, rewards: 0.5466\n",
      "Iteration: 40, Train loss: -0.2739, rewards: 0.5655\n",
      "Iteration: 60, Train loss: -0.2353, rewards: 0.5782\n",
      "Iteration: 80, Train loss: -0.2635, rewards: 0.6184\n",
      "Iteration: 100, Train loss: -0.2820, rewards: 0.6265\n",
      "Iteration: 120, Train loss: -0.1936, rewards: 0.6217\n",
      "Iteration: 140, Train loss: -0.2573, rewards: 0.6421\n",
      "Iteration: 160, Train loss: -0.2133, rewards: 0.6513\n",
      "Iteration: 180, Train loss: -0.2187, rewards: 0.6102\n",
      "Iteration: 200, Train loss: -0.2314, rewards: 0.6529\n",
      "Eval:\n",
      "Hits@1: 0.6488, Hits@3: 0.6627, Hits@10: 0.6786, MRR: 0.6573\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.2618, rewards: 0.6355\n",
      "Iteration: 240, Train loss: -0.2416, rewards: 0.6839\n",
      "Iteration: 260, Train loss: -0.2079, rewards: 0.6430\n",
      "Iteration: 280, Train loss: -0.2126, rewards: 0.6424\n",
      "Iteration: 300, Train loss: -0.2431, rewards: 0.6395\n",
      "Iteration: 320, Train loss: -0.2310, rewards: 0.6611\n",
      "Iteration: 340, Train loss: -0.2195, rewards: 0.6652\n",
      "Iteration: 360, Train loss: -0.2951, rewards: 0.6584\n",
      "Iteration: 380, Train loss: -0.2449, rewards: 0.6421\n",
      "Iteration: 400, Train loss: -0.2653, rewards: 0.6651\n",
      "Eval:\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hits@1: 0.6607, Hits@3: 0.6706, Hits@10: 0.6806, MRR: 0.6672\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.2787, rewards: 0.6659\n",
      "Iteration: 440, Train loss: -0.2616, rewards: 0.6470\n",
      "Iteration: 460, Train loss: -0.2687, rewards: 0.6775\n",
      "Iteration: 480, Train loss: -0.2700, rewards: 0.6791\n",
      "Iteration: 500, Train loss: -0.2958, rewards: 0.6635\n",
      "Iteration: 520, Train loss: -0.2338, rewards: 0.6529\n",
      "Iteration: 540, Train loss: -0.2167, rewards: 0.6475\n",
      "Iteration: 560, Train loss: -0.3060, rewards: 0.6544\n",
      "Iteration: 580, Train loss: -0.2893, rewards: 0.6489\n",
      "Iteration: 600, Train loss: -0.3164, rewards: 0.6615\n",
      "Eval:\n",
      "Hits@1: 0.6528, Hits@3: 0.6667, Hits@10: 0.6806, MRR: 0.6617\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.3699, rewards: 0.6538\n",
      "Iteration: 640, Train loss: -0.3411, rewards: 0.6684\n",
      "Iteration: 660, Train loss: -0.3189, rewards: 0.6268\n",
      "Iteration: 680, Train loss: -0.3029, rewards: 0.6666\n",
      "Iteration: 700, Train loss: -0.3249, rewards: 0.6596\n",
      "Iteration: 720, Train loss: -0.2766, rewards: 0.6849\n",
      "Iteration: 740, Train loss: -0.2839, rewards: 0.6607\n",
      "Iteration: 760, Train loss: -0.3180, rewards: 0.6572\n",
      "Iteration: 780, Train loss: -0.3274, rewards: 0.6786\n",
      "Iteration: 800, Train loss: -0.2735, rewards: 0.6784\n",
      "Eval:\n",
      "Hits@1: 0.6548, Hits@3: 0.6726, Hits@10: 0.6825, MRR: 0.6655\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.3283, rewards: 0.6663\n",
      "Iteration: 840, Train loss: -0.3420, rewards: 0.6560\n",
      "Iteration: 860, Train loss: -0.2433, rewards: 0.6706\n",
      "Iteration: 880, Train loss: -0.2713, rewards: 0.6677\n",
      "Iteration: 900, Train loss: -0.3374, rewards: 0.6582\n",
      "Iteration: 920, Train loss: -0.2723, rewards: 0.6820\n",
      "Iteration: 940, Train loss: -0.3474, rewards: 0.6738\n",
      "Iteration: 960, Train loss: -0.3355, rewards: 0.6829\n",
      "Iteration: 980, Train loss: -0.3371, rewards: 0.6807\n",
      "Iteration: 1000, Train loss: -0.3653, rewards: 0.6762\n",
      "Eval:\n",
      "Hits@1: 0.6627, Hits@3: 0.6706, Hits@10: 0.6806, MRR: 0.6686\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.3672, rewards: 0.6795\n",
      "Iteration: 1040, Train loss: -0.3731, rewards: 0.6534\n",
      "Iteration: 1060, Train loss: -0.3634, rewards: 0.6631\n",
      "Iteration: 1080, Train loss: -0.3715, rewards: 0.6761\n",
      "Iteration: 1100, Train loss: -0.3378, rewards: 0.6729\n",
      "Iteration: 1120, Train loss: -0.3155, rewards: 0.6715\n",
      "Iteration: 1140, Train loss: -0.3445, rewards: 0.6459\n",
      "Iteration: 1160, Train loss: -0.3241, rewards: 0.7018\n",
      "Iteration: 1180, Train loss: -0.3048, rewards: 0.6987\n",
      "Iteration: 1200, Train loss: -0.3545, rewards: 0.7014\n",
      "Eval:\n",
      "Hits@1: 0.6587, Hits@3: 0.6726, Hits@10: 0.6766, MRR: 0.6669\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.3436, rewards: 0.6617\n",
      "Iteration: 1240, Train loss: -0.3074, rewards: 0.6697\n",
      "Iteration: 1260, Train loss: -0.3099, rewards: 0.6743\n",
      "Iteration: 1280, Train loss: -0.3598, rewards: 0.6729\n",
      "Iteration: 1300, Train loss: -0.3156, rewards: 0.6486\n",
      "Iteration: 1320, Train loss: -0.3540, rewards: 0.6513\n",
      "Iteration: 1340, Train loss: -0.3792, rewards: 0.6904\n",
      "Iteration: 1360, Train loss: -0.3266, rewards: 0.6747\n",
      "Iteration: 1380, Train loss: -0.3712, rewards: 0.6550\n",
      "Iteration: 1400, Train loss: -0.3760, rewards: 0.6622\n",
      "Eval:\n",
      "Hits@1: 0.6627, Hits@3: 0.6746, Hits@10: 0.6885, MRR: 0.6710\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.3599, rewards: 0.6679\n",
      "Iteration: 1440, Train loss: -0.3746, rewards: 0.6658\n",
      "Iteration: 1460, Train loss: -0.4036, rewards: 0.6837\n",
      "Iteration: 1480, Train loss: -0.2479, rewards: 0.6625\n",
      "Iteration: 1500, Train loss: -0.3222, rewards: 0.6580\n",
      "Iteration: 1520, Train loss: -0.3065, rewards: 0.6604\n",
      "Iteration: 1540, Train loss: -0.3871, rewards: 0.6898\n",
      "Iteration: 1560, Train loss: -0.2932, rewards: 0.6640\n",
      "Iteration: 1580, Train loss: -0.2697, rewards: 0.6830\n",
      "Iteration: 1600, Train loss: -0.3535, rewards: 0.6654\n",
      "Eval:\n",
      "Hits@1: 0.6567, Hits@3: 0.6746, Hits@10: 0.6845, MRR: 0.6675\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.3209, rewards: 0.6711\n",
      "Iteration: 1640, Train loss: -0.3906, rewards: 0.6534\n",
      "Iteration: 1660, Train loss: -0.3196, rewards: 0.6529\n",
      "Iteration: 1680, Train loss: -0.3205, rewards: 0.6641\n",
      "Iteration: 1700, Train loss: -0.3849, rewards: 0.6495\n",
      "Iteration: 1720, Train loss: -0.3457, rewards: 0.6581\n",
      "Iteration: 1740, Train loss: -0.3079, rewards: 0.6657\n",
      "Iteration: 1760, Train loss: -0.2942, rewards: 0.6929\n",
      "Iteration: 1780, Train loss: -0.3473, rewards: 0.6893\n",
      "Iteration: 1800, Train loss: -0.3693, rewards: 0.6793\n",
      "Eval:\n",
      "Hits@1: 0.6627, Hits@3: 0.6766, Hits@10: 0.6865, MRR: 0.6708\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.3362, rewards: 0.7023\n",
      "Iteration: 1840, Train loss: -0.3294, rewards: 0.6929\n",
      "Iteration: 1860, Train loss: -0.3522, rewards: 0.6498\n",
      "Iteration: 1880, Train loss: -0.3671, rewards: 0.6879\n",
      "Iteration: 1900, Train loss: -0.3819, rewards: 0.6852\n",
      "Iteration: 1920, Train loss: -0.3545, rewards: 0.6579\n",
      "Iteration: 1940, Train loss: -0.3076, rewards: 0.6792\n",
      "Iteration: 1960, Train loss: -0.2931, rewards: 0.6717\n",
      "Iteration: 1980, Train loss: -0.3297, rewards: 0.6680\n",
      "Iteration: 2000, Train loss: -0.2983, rewards: 0.6968\n",
      "Eval:\n",
      "Hits@1: 0.6647, Hits@3: 0.6786, Hits@10: 0.6845, MRR: 0.6728\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/worksfor//test_beam/ ]\n",
      "Hits@1: 0.5263, Hits@3: 0.7076, Hits@10: 0.7388, MRR: 0.6168\n",
      "MINERVA MAP: 0.8092869224995116 (421 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: 0.0080, rewards: 0.7071\n",
      "Iteration: 40, Train loss: 0.0376, rewards: 0.7133\n",
      "Iteration: 60, Train loss: 0.0314, rewards: 0.7312\n",
      "Iteration: 80, Train loss: 0.0724, rewards: 0.7150\n",
      "Iteration: 100, Train loss: 0.0523, rewards: 0.7277\n",
      "Iteration: 120, Train loss: 0.0407, rewards: 0.7314\n",
      "Iteration: 140, Train loss: 0.1130, rewards: 0.7176\n",
      "Iteration: 160, Train loss: 0.0654, rewards: 0.7454\n",
      "Iteration: 180, Train loss: 0.1240, rewards: 0.7374\n",
      "Iteration: 200, Train loss: 0.1072, rewards: 0.7395\n",
      "Eval:\n",
      "Hits@1: 0.7189, Hits@3: 0.7229, Hits@10: 0.7309, MRR: 0.7225\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: 0.0813, rewards: 0.7690\n",
      "Iteration: 240, Train loss: 0.0863, rewards: 0.7585\n",
      "Iteration: 260, Train loss: 0.0821, rewards: 0.7579\n",
      "Iteration: 280, Train loss: 0.1045, rewards: 0.7535\n",
      "Iteration: 300, Train loss: 0.0992, rewards: 0.7557\n",
      "Iteration: 320, Train loss: 0.1241, rewards: 0.7539\n",
      "Iteration: 340, Train loss: 0.1163, rewards: 0.7700\n",
      "Iteration: 360, Train loss: 0.1294, rewards: 0.7417\n",
      "Iteration: 380, Train loss: 0.1404, rewards: 0.7345\n",
      "Iteration: 400, Train loss: 0.1450, rewards: 0.7536\n",
      "Eval:\n",
      "Hits@1: 0.7229, Hits@3: 0.7269, Hits@10: 0.7269, MRR: 0.7252\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: 0.1487, rewards: 0.7630\n",
      "Iteration: 440, Train loss: 0.1133, rewards: 0.7637\n",
      "Iteration: 460, Train loss: 0.1483, rewards: 0.7507\n",
      "Iteration: 480, Train loss: 0.1329, rewards: 0.7510\n",
      "Iteration: 500, Train loss: 0.1493, rewards: 0.7508\n",
      "Iteration: 520, Train loss: 0.1196, rewards: 0.7588\n",
      "Iteration: 540, Train loss: 0.1580, rewards: 0.7529\n",
      "Iteration: 560, Train loss: 0.1551, rewards: 0.7416\n",
      "Iteration: 580, Train loss: 0.2018, rewards: 0.7641\n",
      "Iteration: 600, Train loss: 0.1519, rewards: 0.7693\n",
      "Eval:\n",
      "Hits@1: 0.7108, Hits@3: 0.7269, Hits@10: 0.7269, MRR: 0.7179\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: 0.1392, rewards: 0.7482\n",
      "Iteration: 640, Train loss: 0.1439, rewards: 0.7612\n",
      "Iteration: 660, Train loss: 0.1570, rewards: 0.7463\n",
      "Iteration: 680, Train loss: 0.1409, rewards: 0.7547\n",
      "Iteration: 700, Train loss: 0.1468, rewards: 0.7346\n",
      "Iteration: 720, Train loss: 0.1518, rewards: 0.7542\n",
      "Iteration: 740, Train loss: 0.1429, rewards: 0.7765\n",
      "Iteration: 760, Train loss: 0.1827, rewards: 0.7382\n",
      "Iteration: 780, Train loss: 0.1423, rewards: 0.7709\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 800, Train loss: 0.1665, rewards: 0.7452\n",
      "Eval:\n",
      "Hits@1: 0.7229, Hits@3: 0.7269, Hits@10: 0.7309, MRR: 0.7250\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: 0.1470, rewards: 0.7489\n",
      "Iteration: 840, Train loss: 0.1451, rewards: 0.7557\n",
      "Iteration: 860, Train loss: 0.1503, rewards: 0.7484\n",
      "Iteration: 880, Train loss: 0.1159, rewards: 0.7508\n",
      "Iteration: 900, Train loss: 0.0807, rewards: 0.7672\n",
      "Iteration: 920, Train loss: 0.0854, rewards: 0.7465\n",
      "Iteration: 940, Train loss: 0.1004, rewards: 0.7599\n",
      "Iteration: 960, Train loss: 0.0037, rewards: 0.7776\n",
      "Iteration: 980, Train loss: 0.0727, rewards: 0.7395\n",
      "Iteration: 1000, Train loss: 0.0433, rewards: 0.7364\n",
      "Eval:\n",
      "Hits@1: 0.7229, Hits@3: 0.7309, Hits@10: 0.7309, MRR: 0.7265\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: 0.0656, rewards: 0.7704\n",
      "Iteration: 1040, Train loss: 0.0787, rewards: 0.7488\n",
      "Iteration: 1060, Train loss: 0.0816, rewards: 0.7616\n",
      "Iteration: 1080, Train loss: 0.0439, rewards: 0.7647\n",
      "Iteration: 1100, Train loss: 0.0830, rewards: 0.7793\n",
      "Iteration: 1120, Train loss: 0.0773, rewards: 0.7646\n",
      "Iteration: 1140, Train loss: 0.0376, rewards: 0.7598\n",
      "Iteration: 1160, Train loss: 0.0955, rewards: 0.7595\n",
      "Iteration: 1180, Train loss: 0.0534, rewards: 0.7620\n",
      "Iteration: 1200, Train loss: 0.0281, rewards: 0.7620\n",
      "Eval:\n",
      "Hits@1: 0.7229, Hits@3: 0.7309, Hits@10: 0.7309, MRR: 0.7262\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: 0.0382, rewards: 0.7584\n",
      "Iteration: 1240, Train loss: 0.0581, rewards: 0.7575\n",
      "Iteration: 1260, Train loss: 0.0488, rewards: 0.7416\n",
      "Iteration: 1280, Train loss: -0.0146, rewards: 0.7631\n",
      "Iteration: 1300, Train loss: 0.0082, rewards: 0.7584\n",
      "Iteration: 1320, Train loss: 0.0752, rewards: 0.7513\n",
      "Iteration: 1340, Train loss: 0.0205, rewards: 0.7661\n",
      "Iteration: 1360, Train loss: 0.0626, rewards: 0.7486\n",
      "Iteration: 1380, Train loss: 0.0893, rewards: 0.7589\n",
      "Iteration: 1400, Train loss: 0.0516, rewards: 0.7621\n",
      "Eval:\n",
      "Hits@1: 0.7229, Hits@3: 0.7309, Hits@10: 0.7349, MRR: 0.7266\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: 0.1080, rewards: 0.7455\n",
      "Iteration: 1440, Train loss: 0.0822, rewards: 0.7514\n",
      "Iteration: 1460, Train loss: 0.0633, rewards: 0.7416\n",
      "Iteration: 1480, Train loss: 0.0322, rewards: 0.7689\n",
      "Iteration: 1500, Train loss: 0.0006, rewards: 0.7681\n",
      "Iteration: 1520, Train loss: -0.0187, rewards: 0.7350\n",
      "Iteration: 1540, Train loss: 0.0290, rewards: 0.7525\n",
      "Iteration: 1560, Train loss: 0.0055, rewards: 0.7724\n",
      "Iteration: 1580, Train loss: 0.0436, rewards: 0.7588\n",
      "Iteration: 1600, Train loss: 0.0740, rewards: 0.7547\n",
      "Eval:\n",
      "Hits@1: 0.7269, Hits@3: 0.7309, Hits@10: 0.7349, MRR: 0.7293\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.0270, rewards: 0.7446\n",
      "Iteration: 1640, Train loss: 0.0650, rewards: 0.7620\n",
      "Iteration: 1660, Train loss: 0.0747, rewards: 0.7551\n",
      "Iteration: 1680, Train loss: -0.0683, rewards: 0.7726\n",
      "Iteration: 1700, Train loss: 0.0490, rewards: 0.7491\n",
      "Iteration: 1720, Train loss: 0.0485, rewards: 0.7482\n",
      "Iteration: 1740, Train loss: 0.0201, rewards: 0.7754\n",
      "Iteration: 1760, Train loss: 0.0231, rewards: 0.7528\n",
      "Iteration: 1780, Train loss: 0.0704, rewards: 0.7429\n",
      "Iteration: 1800, Train loss: 0.0160, rewards: 0.7553\n",
      "Eval:\n",
      "Hits@1: 0.7269, Hits@3: 0.7349, Hits@10: 0.7349, MRR: 0.7303\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: 0.0404, rewards: 0.7759\n",
      "Iteration: 1840, Train loss: 0.0269, rewards: 0.7632\n",
      "Iteration: 1860, Train loss: 0.0955, rewards: 0.7554\n",
      "Iteration: 1880, Train loss: 0.0438, rewards: 0.7590\n",
      "Iteration: 1900, Train loss: 0.0284, rewards: 0.7501\n",
      "Iteration: 1920, Train loss: 0.0545, rewards: 0.7474\n",
      "Iteration: 1940, Train loss: -0.0023, rewards: 0.7274\n",
      "Iteration: 1960, Train loss: 0.0548, rewards: 0.7672\n",
      "Iteration: 1980, Train loss: -0.0117, rewards: 0.7729\n",
      "Iteration: 2000, Train loss: 0.0364, rewards: 0.7621\n",
      "Eval:\n",
      "Hits@1: 0.7269, Hits@3: 0.7349, Hits@10: 0.7349, MRR: 0.7309\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/organizationheadquarteredincity//test_beam/ ]\n",
      "Hits@1: 0.7349, Hits@3: 0.8112, Hits@10: 0.8434, MRR: 0.7768\n",
      "MINERVA MAP: 0.9370864410021037 (249 queries evaluated)\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 20, Train loss: -0.4414, rewards: 0.6148\n",
      "Iteration: 40, Train loss: -0.4095, rewards: 0.6450\n",
      "Iteration: 60, Train loss: -0.4388, rewards: 0.6692\n",
      "Iteration: 80, Train loss: -0.4370, rewards: 0.6770\n",
      "Iteration: 100, Train loss: -0.4696, rewards: 0.6821\n",
      "Iteration: 120, Train loss: -0.4381, rewards: 0.6705\n",
      "Iteration: 140, Train loss: -0.4497, rewards: 0.6799\n",
      "Iteration: 160, Train loss: -0.4128, rewards: 0.6938\n",
      "Iteration: 180, Train loss: -0.4358, rewards: 0.6866\n",
      "Iteration: 200, Train loss: -0.4558, rewards: 0.6897\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7051, Hits@10: 0.7051, MRR: 0.7006\n",
      "------------------------------------------------------------\n",
      "Iteration: 220, Train loss: -0.3944, rewards: 0.7240\n",
      "Iteration: 240, Train loss: -0.3977, rewards: 0.7151\n",
      "Iteration: 260, Train loss: -0.4757, rewards: 0.6980\n",
      "Iteration: 280, Train loss: -0.4612, rewards: 0.6971\n",
      "Iteration: 300, Train loss: -0.4690, rewards: 0.7071\n",
      "Iteration: 320, Train loss: -0.4327, rewards: 0.6946\n",
      "Iteration: 340, Train loss: -0.4845, rewards: 0.6925\n",
      "Iteration: 360, Train loss: -0.4777, rewards: 0.6878\n",
      "Iteration: 380, Train loss: -0.4178, rewards: 0.7160\n",
      "Iteration: 400, Train loss: -0.4376, rewards: 0.7151\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7051, Hits@10: 0.7051, MRR: 0.7030\n",
      "------------------------------------------------------------\n",
      "Iteration: 420, Train loss: -0.4445, rewards: 0.7137\n",
      "Iteration: 440, Train loss: -0.4779, rewards: 0.7106\n",
      "Iteration: 460, Train loss: -0.4615, rewards: 0.7203\n",
      "Iteration: 480, Train loss: -0.4948, rewards: 0.7008\n",
      "Iteration: 500, Train loss: -0.4583, rewards: 0.7062\n",
      "Iteration: 520, Train loss: -0.4645, rewards: 0.7052\n",
      "Iteration: 540, Train loss: -0.5122, rewards: 0.7139\n",
      "Iteration: 560, Train loss: -0.4896, rewards: 0.7084\n",
      "Iteration: 580, Train loss: -0.4418, rewards: 0.7036\n",
      "Iteration: 600, Train loss: -0.5069, rewards: 0.7085\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7051, Hits@10: 0.7051, MRR: 0.7028\n",
      "------------------------------------------------------------\n",
      "Iteration: 620, Train loss: -0.4556, rewards: 0.7257\n",
      "Iteration: 640, Train loss: -0.4358, rewards: 0.7264\n",
      "Iteration: 660, Train loss: -0.3824, rewards: 0.6912\n",
      "Iteration: 680, Train loss: -0.4386, rewards: 0.7128\n",
      "Iteration: 700, Train loss: -0.4427, rewards: 0.7295\n",
      "Iteration: 720, Train loss: -0.4325, rewards: 0.7083\n",
      "Iteration: 740, Train loss: -0.4513, rewards: 0.6961\n",
      "Iteration: 760, Train loss: -0.4822, rewards: 0.7041\n",
      "Iteration: 780, Train loss: -0.4516, rewards: 0.7155\n",
      "Iteration: 800, Train loss: -0.5027, rewards: 0.7211\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7076\n",
      "------------------------------------------------------------\n",
      "Iteration: 820, Train loss: -0.4862, rewards: 0.7371\n",
      "Iteration: 840, Train loss: -0.4442, rewards: 0.7159\n",
      "Iteration: 860, Train loss: -0.4202, rewards: 0.6918\n",
      "Iteration: 880, Train loss: -0.5220, rewards: 0.6901\n",
      "Iteration: 900, Train loss: -0.4891, rewards: 0.7328\n",
      "Iteration: 920, Train loss: -0.4936, rewards: 0.7314\n",
      "Iteration: 940, Train loss: -0.5005, rewards: 0.7173\n",
      "Iteration: 960, Train loss: -0.5538, rewards: 0.7111\n",
      "Iteration: 980, Train loss: -0.4449, rewards: 0.7119\n",
      "Iteration: 1000, Train loss: -0.5197, rewards: 0.6970\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7100\n",
      "------------------------------------------------------------\n",
      "Iteration: 1020, Train loss: -0.4911, rewards: 0.7074\n",
      "Iteration: 1040, Train loss: -0.4591, rewards: 0.6988\n",
      "Iteration: 1060, Train loss: -0.5158, rewards: 0.6975\n",
      "Iteration: 1080, Train loss: -0.4760, rewards: 0.7153\n",
      "Iteration: 1100, Train loss: -0.5176, rewards: 0.7246\n",
      "Iteration: 1120, Train loss: -0.4961, rewards: 0.7147\n",
      "Iteration: 1140, Train loss: -0.4999, rewards: 0.7121\n",
      "Iteration: 1160, Train loss: -0.4779, rewards: 0.7126\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1180, Train loss: -0.4911, rewards: 0.7190\n",
      "Iteration: 1200, Train loss: -0.4628, rewards: 0.7248\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7097\n",
      "------------------------------------------------------------\n",
      "Iteration: 1220, Train loss: -0.4195, rewards: 0.7398\n",
      "Iteration: 1240, Train loss: -0.5191, rewards: 0.7090\n",
      "Iteration: 1260, Train loss: -0.5008, rewards: 0.7191\n",
      "Iteration: 1280, Train loss: -0.4641, rewards: 0.7084\n",
      "Iteration: 1300, Train loss: -0.4656, rewards: 0.7539\n",
      "Iteration: 1320, Train loss: -0.4700, rewards: 0.7061\n",
      "Iteration: 1340, Train loss: -0.4958, rewards: 0.7184\n",
      "Iteration: 1360, Train loss: -0.5123, rewards: 0.7196\n",
      "Iteration: 1380, Train loss: -0.4457, rewards: 0.7429\n",
      "Iteration: 1400, Train loss: -0.4670, rewards: 0.7270\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7069\n",
      "------------------------------------------------------------\n",
      "Iteration: 1420, Train loss: -0.5041, rewards: 0.7201\n",
      "Iteration: 1440, Train loss: -0.5172, rewards: 0.6975\n",
      "Iteration: 1460, Train loss: -0.5004, rewards: 0.7009\n",
      "Iteration: 1480, Train loss: -0.4826, rewards: 0.7170\n",
      "Iteration: 1500, Train loss: -0.4238, rewards: 0.7375\n",
      "Iteration: 1520, Train loss: -0.5085, rewards: 0.7173\n",
      "Iteration: 1540, Train loss: -0.4922, rewards: 0.7319\n",
      "Iteration: 1560, Train loss: -0.4953, rewards: 0.7160\n",
      "Iteration: 1580, Train loss: -0.4434, rewards: 0.7048\n",
      "Iteration: 1600, Train loss: -0.4971, rewards: 0.7225\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7099\n",
      "------------------------------------------------------------\n",
      "Iteration: 1620, Train loss: -0.4746, rewards: 0.7225\n",
      "Iteration: 1640, Train loss: -0.4868, rewards: 0.7321\n",
      "Iteration: 1660, Train loss: -0.4751, rewards: 0.7275\n",
      "Iteration: 1680, Train loss: -0.4667, rewards: 0.7147\n",
      "Iteration: 1700, Train loss: -0.5284, rewards: 0.6907\n",
      "Iteration: 1720, Train loss: -0.4859, rewards: 0.7204\n",
      "Iteration: 1740, Train loss: -0.5150, rewards: 0.7205\n",
      "Iteration: 1760, Train loss: -0.5260, rewards: 0.7254\n",
      "Iteration: 1780, Train loss: -0.5127, rewards: 0.7202\n",
      "Iteration: 1800, Train loss: -0.4874, rewards: 0.7151\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7100\n",
      "------------------------------------------------------------\n",
      "Iteration: 1820, Train loss: -0.5096, rewards: 0.7120\n",
      "Iteration: 1840, Train loss: -0.4806, rewards: 0.7235\n",
      "Iteration: 1860, Train loss: -0.5923, rewards: 0.6973\n",
      "Iteration: 1880, Train loss: -0.4805, rewards: 0.7234\n",
      "Iteration: 1900, Train loss: -0.5488, rewards: 0.7395\n",
      "Iteration: 1920, Train loss: -0.5396, rewards: 0.7092\n",
      "Iteration: 1940, Train loss: -0.4318, rewards: 0.7008\n",
      "Iteration: 1960, Train loss: -0.5393, rewards: 0.7291\n",
      "Iteration: 1980, Train loss: -0.4928, rewards: 0.7081\n",
      "Iteration: 2000, Train loss: -0.5472, rewards: 0.6877\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7097\n",
      "------------------------------------------------------------\n",
      "INFO:root:[ printing paths at ./outputs_NELL-sub-tune/personleadsorganization//test_beam/ ]\n",
      "Hits@1: 0.6422, Hits@3: 0.7457, Hits@10: 0.7629, MRR: 0.6933\n",
      "MINERVA MAP: 0.8691895389264657 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "from model.ours2 import *\n",
    "\n",
    "sub_tasks_list = ['AthletePlaysInLeague',\n",
    "'AthletePlaysForTeam ',\n",
    "'AthleteHomeStadium ',\n",
    "'TeamPlaysSport',\n",
    "'AthletePlaysSport',\n",
    "'OrganizationHiredPerson',\n",
    "'PersonBornInLocation',\n",
    "'WorksFor',\n",
    "'organizationheadquarteredincity',\n",
    "'PersonLeadsOrganization']\n",
    "\n",
    "results_collect = {}\n",
    "for sub_task in sub_tasks_list:\n",
    "    params = set_params(1, 64, 0.1, 0.1, 0.0001, sub_task.lower().strip())\n",
    "    sub_trainer = Trainer(params)\n",
    "    sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "    sub_trainer.agent.train()\n",
    "    sub_trainer.train()\n",
    "    \n",
    "    save_path = sub_trainer.save_path\n",
    "    output_dir = sub_trainer.output_dir\n",
    "    path_logger_file = output_dir\n",
    "\n",
    "    if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "        os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "    sub_trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "    with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "        score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "    sub_trainer.test_environment = sub_trainer.test_test_environment\n",
    "    sub_trainer.test_environment.test_rollouts = 100\n",
    "    test_results = sub_trainer.test(beam=True, print_paths=True, save_model=True)  \n",
    "\n",
    "    sub_trainer.data_input_dir = f'../MINERVA/datasets/data_preprocessed/{sub_task.lower().strip()}'\n",
    "    MAP = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", sub_trainer.data_input_dir+'/sort_test.pairs')\n",
    "    results_collect[sub_task] = MAP\n",
    "    \n",
    "    del sub_trainer\n",
    "    torch.cuda.empty_cache()\n",
    "    gc.collect()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "90494531",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'AthletePlaysInLeague': 0.9727471566054243,\n",
       " 'AthletePlaysForTeam ': 0.8109486336230524,\n",
       " 'AthleteHomeStadium ': 0.9133484812589291,\n",
       " 'TeamPlaysSport': 0.8701105442176871,\n",
       " 'AthletePlaysSport': 0.9709508015478165,\n",
       " 'OrganizationHiredPerson': 0.8538014972190072,\n",
       " 'PersonBornInLocation': 0.7679664894690801,\n",
       " 'WorksFor': 0.8092869224995116,\n",
       " 'organizationheadquarteredincity': 0.9370864410021037,\n",
       " 'PersonLeadsOrganization': 0.8691895389264657}"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "results_collect"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
