{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "b2479ab1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "# Pin this kernel to a single GPU / MIG slice. CUDA reads CUDA_VISIBLE_DEVICES when it\n",
    "# is initialised, so the variable is set before the model import below.\n",
    "# NOTE(review): the MIG UUID is machine-specific -- change it when running elsewhere.\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-a0bf155a-639b-5746-92c8-243d8972b5a9\"\n",
    "\n",
    "# Later cells use Trainer, nell_eval and torch without importing them, so they\n",
    "# presumably come from this star import -- TODO confirm and import them explicitly.\n",
    "from model.ours3 import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "a39d5a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(task = None):\n",
    "    \"\"\"Build the option dictionary passed to ``Trainer``.\n",
    "\n",
    "    Args:\n",
    "        task: name of a sub-task directory under\n",
    "            ``../MINERVA/datasets/data_preprocessed/``. ``None`` selects the\n",
    "            ``nell-995`` data and the base output directory.\n",
    "\n",
    "    Returns:\n",
    "        dict holding paths, the two vocabularies loaded from JSON, agent\n",
    "        settings and hyperparameters. ``pretrain_model_dir`` is only set\n",
    "        when ``task`` is given.\n",
    "\n",
    "    Raises:\n",
    "        OSError: if a vocabulary file cannot be opened.\n",
    "\n",
    "    Side effects:\n",
    "        When ``task`` is given, creates ``./outputs_nell995-1/<task>/`` if\n",
    "        it does not exist yet.\n",
    "    \"\"\"\n",
    "    options = {}\n",
    "\n",
    "    # basic setting\n",
    "    task_name = 'nell-995' if task is None else task\n",
    "\n",
    "    options['use_cuda'] = True\n",
    "    # The vocabulary is always read from the 'nell' directory, whatever the task.\n",
    "    options['vocab_dir'] = '../MINERVA/datasets/data_preprocessed/nell/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "    # Context managers close the vocab files deterministically instead of\n",
    "    # leaving the handles to the garbage collector.\n",
    "    with open(options['vocab_dir'] + '/relation_vocab.json') as vocab_file:\n",
    "        options['relation_vocab'] = json.load(vocab_file)\n",
    "    with open(options['vocab_dir'] + '/entity_vocab.json') as vocab_file:\n",
    "        options['entity_vocab'] = json.load(vocab_file)\n",
    "\n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_nell995-1/'\n",
    "        options['output_dir'] = './outputs_nell995-1/'\n",
    "    else:\n",
    "        # Sub-task runs start from the checkpoint in the base directory and\n",
    "        # write their own results into a per-task sub-directory.\n",
    "        options['pretrain_model_dir'] = './outputs_nell995-1/'\n",
    "        options['model_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        # exist_ok avoids the check-then-create race of exists() + makedirs().\n",
    "        os.makedirs(options['output_dir'], exist_ok=True)\n",
    "        os.makedirs(options['model_dir'], exist_ok=True)\n",
    "\n",
    "    # agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = 1\n",
    "    options['max_num_actions'] = 40\n",
    "    options['gnn_layer'] = 2\n",
    "\n",
    "    # hyperparameters\n",
    "    options['test_rollouts'] = 40\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = 64\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = 0.15\n",
    "    options['Lambda'] = 0.15\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = 0.00005\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 5\n",
    "    # True division: with the default batch size this is the float 20.0.\n",
    "    # NOTE(review): callers that need an int iteration count must convert it.\n",
    "    options['total_iterations'] = 20*(64/options['batch_size'])\n",
    "    options['pool'] = 'max'\n",
    "\n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "12f1b8ba",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n"
     ]
    }
   ],
   "source": [
    "# Beam-search test of the agent checkpoint stored in model_dir, using the default\n",
    "# (task=None) options with larger rollout / action limits and a smaller eval batch.\n",
    "params = set_params()\n",
    "params['test_rollouts'] = 100\n",
    "params['max_num_actions'] = 100\n",
    "params['eval_batch_size'] = 8\n",
    "\n",
    "trainer = Trainer(params)\n",
    "# map_location='cpu' (as objective() does) keeps the load independent of the device the\n",
    "# checkpoint was saved from; load_state_dict then copies the weights into the agent.\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location='cpu'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "output_dir = trainer.output_dir\n",
    "# Paths are logged under the trainer's output directory.\n",
    "path_logger_file = output_dir\n",
    "\n",
    "# exist_ok replaces the racy exists() + mkdir() pair.\n",
    "os.makedirs(path_logger_file + \"/\" + \"test_beam\", exist_ok=True)\n",
    "trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "# Point the trainer's test environment at its test_test_environment before testing.\n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "17bc5425",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8207787473535506 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6278593427818233 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.572523027000639 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8249362244897959 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9319237147595357 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.9153204137843777 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.8065181795751745 (193 queries evaluated)\n",
      "WorksFor.txt\n",
      "MINERVA MAP: 0.8287528177373783 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.9408317251690747 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8386739927983896 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "# Sub-task names. Entries are kept verbatim (two carry a trailing space)\n",
    "# because they are printed and used as the keys of map_list.\n",
    "sub_tasks_list = [\n",
    "    'AthletePlaysInLeague',\n",
    "    'AthletePlaysForTeam ',\n",
    "    'AthleteHomeStadium ',\n",
    "    'TeamPlaysSport',\n",
    "    'AthletePlaysSport',\n",
    "    'OrganizationHiredPerson',\n",
    "    'PersonBornInLocation',\n",
    "    'WorksFor',\n",
    "    'organizationheadquarteredincity',\n",
    "    'PersonLeadsOrganization',\n",
    "]\n",
    "\n",
    "# Value returned by nell_eval for each sub-task, keyed by the printed label.\n",
    "map_list = {}\n",
    "for sub_task in sub_tasks_list:\n",
    "    trainer.data_input_dir = '../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "    # Only WorksFor gets a '.txt' suffix appended (presumably its ranking file\n",
    "    # is named that way -- verify against the dataset directory).\n",
    "    if sub_task.lower() == 'worksfor':\n",
    "        sub_task += '.txt'\n",
    "    print(sub_task)\n",
    "\n",
    "    answers_file = path_logger_file + \"/test_beam/pathsanswers\"\n",
    "    ranking_file = trainer.data_input_dir + f'/sort_test_{sub_task.lower().strip()}'\n",
    "    map_list[sub_task] = nell_eval(answers_file, ranking_file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "10a372ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "import optuna\n",
    "from model.ours3 import *\n",
    "# objective() only reads sub_tasks_list[0], so keep exactly one entry enabled.\n",
    "# Every entry ends with a comma so that uncommenting a line can never merge\n",
    "# two adjacent string literals.\n",
    "sub_tasks_list = [\n",
    "    # 'AthletePlaysInLeague',\n",
    "    # 'AthletePlaysForTeam ',\n",
    "    # 'AthleteHomeStadium ',\n",
    "    # 'TeamPlaysSport',\n",
    "    # 'AthletePlaysSport',\n",
    "    # 'OrganizationHiredPerson',\n",
    "    'PersonBornInLocation',\n",
    "    # 'WorksFor',\n",
    "    # 'organizationheadquarteredincity',\n",
    "    # 'PersonLeadsOrganization',\n",
    "]\n",
    "\n",
    "def objective(trial):\n",
    "    \"\"\"Optuna objective: fine-tune the agent on one sub-task and score it.\n",
    "\n",
    "    Samples hyperparameters from ``trial``, trains a ``Trainer`` on\n",
    "    ``sub_tasks_list[0]`` starting from ``pretrain_model_dir/agent.ckpt``,\n",
    "    then loads ``model_dir/agent.ckpt`` into a second ``Trainer``, runs a\n",
    "    beam-search test and evaluates the logged answers with ``nell_eval``.\n",
    "\n",
    "    Args:\n",
    "        trial: object providing ``suggest_float``, ``suggest_int`` and\n",
    "            ``suggest_categorical`` (an Optuna trial).\n",
    "\n",
    "    Returns:\n",
    "        The value returned by ``nell_eval`` for the sub-task.\n",
    "    \"\"\"\n",
    "    # gc is not imported explicitly in the visible notebook cells; importing it\n",
    "    # here keeps the cleanup below independent of the star import.\n",
    "    import gc\n",
    "\n",
    "    sub_task = sub_tasks_list[0]\n",
    "\n",
    "    # NOTE(review): 'lr' is sampled uniformly over four orders of magnitude;\n",
    "    # log=True may suit it better. Left unchanged because Optuna rejects a\n",
    "    # changed distribution for a parameter already recorded in a stored study.\n",
    "    learning_rate = trial.suggest_float('lr', 1e-6, 1e-2)\n",
    "    batch_size = trial.suggest_int('bs', 4, 128)\n",
    "    beta = trial.suggest_float('b', 0, 0.5)\n",
    "    lam = trial.suggest_float('l', 0, 0.5)\n",
    "    eval_every = trial.suggest_categorical('ee', [10,20,50,100])\n",
    "\n",
    "    params = set_params(sub_task.lower().strip())\n",
    "    params['learning_rate'] = learning_rate\n",
    "    params['eval_every'] = eval_every\n",
    "    params['batch_size'] = batch_size\n",
    "    params['beta'] = beta\n",
    "    params['Lambda'] = lam\n",
    "    # 50 evaluation rounds, capped at 2000 iterations.\n",
    "    params['total_iterations'] = min(50*params['eval_every'], 2000)\n",
    "\n",
    "    sub_trainer = None\n",
    "    sub_tester = None\n",
    "    try:\n",
    "        sub_trainer = Trainer(params)\n",
    "        sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "\n",
    "        sub_trainer.agent.train()\n",
    "        sub_trainer.train()\n",
    "\n",
    "        # The trainer is not used after this point: release it before the\n",
    "        # tester is built so both models are not held in memory at once.\n",
    "        sub_trainer = None\n",
    "        gc.collect()\n",
    "        torch.cuda.empty_cache()\n",
    "\n",
    "        params['test_rollouts'] = 100\n",
    "        params['max_num_actions'] = 100\n",
    "        params['eval_batch_size'] = 8\n",
    "\n",
    "        sub_tester = Trainer(params)\n",
    "        # presumably sub_trainer.train() wrote this checkpoint -- verify in Trainer.\n",
    "        sub_tester.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "        sub_tester.agent.eval()\n",
    "\n",
    "        save_path = sub_tester.save_path\n",
    "        output_dir = sub_tester.output_dir\n",
    "        path_logger_file = output_dir\n",
    "\n",
    "        # exist_ok replaces the racy exists() + mkdir() pair.\n",
    "        os.makedirs(path_logger_file + \"/\" + \"test_beam\", exist_ok=True)\n",
    "        sub_tester.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "        with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "            score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "        sub_tester.test_environment = sub_tester.test_test_environment\n",
    "        sub_tester.test(beam=True, print_paths=True, save_model=True)\n",
    "\n",
    "        sub_tester.data_input_dir = '../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "        # Only WorksFor gets a '.txt' suffix appended to its ranking-file name.\n",
    "        if 'worksfor' == sub_task.lower():\n",
    "            sub_task = sub_task + '.txt'\n",
    "        print(sub_task)\n",
    "        MAP = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\",\n",
    "                  sub_tester.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')\n",
    "\n",
    "        return MAP\n",
    "    finally:\n",
    "        # Runs for failed trials too, so one crashed trial does not keep GPU\n",
    "        # memory allocated for the next. Collect garbage first so the cache\n",
    "        # release can actually return the freed blocks.\n",
    "        sub_trainer = None\n",
    "        sub_tester = None\n",
    "        gc.collect()\n",
    "        torch.cuda.empty_cache()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ae521015",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:11:15,785]\u001b[0m A new study created in RDB with name: PersonBornInLocation\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.0240, rewards: 0.3281\n",
      "Iteration: 10, Train loss: -0.0030, rewards: 0.4985\n",
      "Iteration: 15, Train loss: -0.0000, rewards: 0.6119\n",
      "Iteration: 20, Train loss: -0.0025, rewards: 0.5910\n",
      "Iteration: 25, Train loss: -0.0012, rewards: 0.5761\n",
      "Iteration: 30, Train loss: -0.0002, rewards: 0.2239\n",
      "Iteration: 35, Train loss: -0.0010, rewards: 0.4179\n",
      "Iteration: 40, Train loss: -0.0008, rewards: 0.5522\n",
      "Iteration: 45, Train loss: -0.0000, rewards: 0.5403\n",
      "Iteration: 50, Train loss: -0.0943, rewards: 0.5552\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5372, Hits@10: 0.5372, MRR: 0.5236\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.0050, rewards: 0.5552\n",
      "Iteration: 60, Train loss: -0.0157, rewards: 0.6000\n",
      "Iteration: 65, Train loss: -0.0143, rewards: 0.5403\n",
      "Iteration: 70, Train loss: -0.0136, rewards: 0.5522\n",
      "Iteration: 75, Train loss: -0.0088, rewards: 0.5761\n",
      "Iteration: 80, Train loss: -0.0109, rewards: 0.5403\n",
      "Iteration: 85, Train loss: -0.0132, rewards: 0.5373\n",
      "Iteration: 90, Train loss: -0.0200, rewards: 0.5552\n",
      "Iteration: 95, Train loss: -0.0154, rewards: 0.5373\n",
      "Iteration: 100, Train loss: -0.0159, rewards: 0.4060\n",
      "Eval:\n",
      "Hits@1: 0.2713, Hits@3: 0.4415, Hits@10: 0.6223, MRR: 0.3851\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: 0.0024, rewards: 0.0399\n",
      "Iteration: 110, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 115, Train loss: -0.0011, rewards: 0.1194\n",
      "Iteration: 120, Train loss: -0.0017, rewards: 0.1970\n",
      "Iteration: 125, Train loss: -0.0015, rewards: 0.5313\n",
      "Iteration: 130, Train loss: -0.0118, rewards: 0.5061\n",
      "Iteration: 135, Train loss: -0.0164, rewards: 0.4836\n",
      "Iteration: 140, Train loss: -0.0095, rewards: 0.5582\n",
      "Iteration: 145, Train loss: -0.0107, rewards: 0.5463\n",
      "Iteration: 150, Train loss: -0.0183, rewards: 0.5522\n",
      "Eval:\n",
      "Hits@1: 0.5053, Hits@3: 0.5266, Hits@10: 0.5479, MRR: 0.5189\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.0181, rewards: 0.4836\n",
      "Iteration: 160, Train loss: -0.0147, rewards: 0.5463\n",
      "Iteration: 165, Train loss: -0.0065, rewards: 0.5731\n",
      "Iteration: 170, Train loss: -0.0114, rewards: 0.5791\n",
      "Iteration: 175, Train loss: -0.0211, rewards: 0.5672\n",
      "Iteration: 180, Train loss: -0.0174, rewards: 0.5045\n",
      "Iteration: 185, Train loss: -0.0176, rewards: 0.5403\n",
      "Iteration: 190, Train loss: -0.0262, rewards: 0.5343\n",
      "Iteration: 195, Train loss: -0.0178, rewards: 0.5522\n",
      "Iteration: 200, Train loss: -0.0168, rewards: 0.5104\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5212\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.0235, rewards: 0.5343\n",
      "Iteration: 210, Train loss: -0.0218, rewards: 0.5672\n",
      "Iteration: 215, Train loss: -0.0233, rewards: 0.5343\n",
      "Iteration: 220, Train loss: -0.0232, rewards: 0.4836\n",
      "Iteration: 225, Train loss: -0.0181, rewards: 0.5373\n",
      "Iteration: 230, Train loss: -0.0189, rewards: 0.5642\n",
      "Iteration: 235, Train loss: -0.0293, rewards: 0.5224\n",
      "Iteration: 240, Train loss: -0.0142, rewards: 0.5254\n",
      "Iteration: 245, Train loss: -0.0247, rewards: 0.5493\n",
      "Iteration: 250, Train loss: -0.0251, rewards: 0.5433\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.0200, rewards: 0.5433\n",
      "Iteration: 260, Train loss: -0.0233, rewards: 0.5075\n",
      "Iteration: 265, Train loss: -0.0247, rewards: 0.4776\n",
      "Iteration: 270, Train loss: -0.0140, rewards: 0.4507\n",
      "Iteration: 275, Train loss: -0.0281, rewards: 0.4955\n",
      "Iteration: 280, Train loss: -0.0217, rewards: 0.4955\n",
      "Iteration: 285, Train loss: -0.0175, rewards: 0.5045\n",
      "Iteration: 290, Train loss: -0.0223, rewards: 0.5612\n",
      "Iteration: 295, Train loss: -0.0186, rewards: 0.5522\n",
      "Iteration: 300, Train loss: -0.0196, rewards: 0.5075\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.0242, rewards: 0.5284\n",
      "Iteration: 310, Train loss: -0.0182, rewards: 0.5045\n",
      "Iteration: 315, Train loss: -0.0199, rewards: 0.4925\n",
      "Iteration: 320, Train loss: -0.0170, rewards: 0.4627\n",
      "Iteration: 325, Train loss: -0.0319, rewards: 0.5463\n",
      "Iteration: 330, Train loss: -0.0209, rewards: 0.5522\n",
      "Iteration: 335, Train loss: -0.0231, rewards: 0.5373\n",
      "Iteration: 340, Train loss: -0.0244, rewards: 0.5045\n",
      "Iteration: 345, Train loss: -0.0111, rewards: 0.5493\n",
      "Iteration: 350, Train loss: -0.0134, rewards: 0.5075\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -0.0176, rewards: 0.5015\n",
      "Iteration: 360, Train loss: -0.0226, rewards: 0.5403\n",
      "Iteration: 365, Train loss: -0.0218, rewards: 0.4985\n",
      "Iteration: 370, Train loss: -0.0207, rewards: 0.5134\n",
      "Iteration: 375, Train loss: -0.0176, rewards: 0.5522\n",
      "Iteration: 380, Train loss: -0.0202, rewards: 0.5313\n",
      "Iteration: 385, Train loss: -0.0249, rewards: 0.5104\n",
      "Iteration: 390, Train loss: -0.0203, rewards: 0.5433\n",
      "Iteration: 395, Train loss: -0.0173, rewards: 0.5075\n",
      "Iteration: 400, Train loss: -0.0277, rewards: 0.5522\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -0.0151, rewards: 0.5493\n",
      "Iteration: 410, Train loss: -0.0178, rewards: 0.5224\n",
      "Iteration: 415, Train loss: -0.0143, rewards: 0.5313\n",
      "Iteration: 420, Train loss: -0.0167, rewards: 0.5224\n",
      "Iteration: 425, Train loss: -0.0159, rewards: 0.5343\n",
      "Iteration: 430, Train loss: -0.0227, rewards: 0.5164\n",
      "Iteration: 435, Train loss: -0.0205, rewards: 0.5791\n",
      "Iteration: 440, Train loss: -0.0287, rewards: 0.5493\n",
      "Iteration: 445, Train loss: -0.0157, rewards: 0.5343\n",
      "Iteration: 450, Train loss: -0.0116, rewards: 0.5403\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -0.0216, rewards: 0.5433\n",
      "Iteration: 460, Train loss: -0.0136, rewards: 0.5104\n",
      "Iteration: 465, Train loss: -0.0190, rewards: 0.4925\n",
      "Iteration: 470, Train loss: -0.0255, rewards: 0.5731\n",
      "Iteration: 475, Train loss: -0.0152, rewards: 0.5522\n",
      "Iteration: 480, Train loss: -0.0151, rewards: 0.5612\n",
      "Iteration: 485, Train loss: -0.0191, rewards: 0.5791\n",
      "Iteration: 490, Train loss: -0.0136, rewards: 0.5701\n",
      "Iteration: 495, Train loss: -0.0194, rewards: 0.5522\n",
      "Iteration: 500, Train loss: -0.0135, rewards: 0.5134\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -0.0244, rewards: 0.5582\n",
      "Iteration: 510, Train loss: -0.0205, rewards: 0.5642\n",
      "Iteration: 515, Train loss: -0.0235, rewards: 0.5522\n",
      "Iteration: 520, Train loss: -0.0185, rewards: 0.5343\n",
      "Iteration: 525, Train loss: -0.0199, rewards: 0.5403\n",
      "Iteration: 530, Train loss: -0.0223, rewards: 0.5582\n",
      "Iteration: 535, Train loss: -0.0259, rewards: 0.5851\n",
      "Iteration: 540, Train loss: -0.0180, rewards: 0.4925\n",
      "Iteration: 545, Train loss: -0.0178, rewards: 0.4597\n",
      "Iteration: 550, Train loss: -0.0160, rewards: 0.5493\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -0.0209, rewards: 0.5731\n",
      "Iteration: 560, Train loss: -0.0250, rewards: 0.5403\n",
      "Iteration: 565, Train loss: -0.0150, rewards: 0.5821\n",
      "Iteration: 570, Train loss: -0.0178, rewards: 0.5522\n",
      "Iteration: 575, Train loss: -0.0128, rewards: 0.5134\n",
      "Iteration: 580, Train loss: -0.0072, rewards: 0.5343\n",
      "Iteration: 585, Train loss: -0.0173, rewards: 0.4985\n",
      "Iteration: 590, Train loss: -0.0193, rewards: 0.5254\n",
      "Iteration: 595, Train loss: -0.0151, rewards: 0.5313\n",
      "Iteration: 600, Train loss: -0.0268, rewards: 0.5791\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -0.0211, rewards: 0.5254\n",
      "Iteration: 610, Train loss: -0.0280, rewards: 0.5224\n",
      "Iteration: 615, Train loss: -0.0239, rewards: 0.5642\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -0.0148, rewards: 0.4836\n",
      "Iteration: 625, Train loss: -0.0189, rewards: 0.5373\n",
      "Iteration: 630, Train loss: -0.0179, rewards: 0.6060\n",
      "Iteration: 635, Train loss: -0.0202, rewards: 0.5104\n",
      "Iteration: 640, Train loss: -0.0155, rewards: 0.5254\n",
      "Iteration: 645, Train loss: -0.0264, rewards: 0.5403\n",
      "Iteration: 650, Train loss: -0.0221, rewards: 0.5761\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -0.0143, rewards: 0.5761\n",
      "Iteration: 660, Train loss: -0.0228, rewards: 0.4836\n",
      "Iteration: 665, Train loss: -0.0210, rewards: 0.5403\n",
      "Iteration: 670, Train loss: -0.0193, rewards: 0.5164\n",
      "Iteration: 675, Train loss: -0.0149, rewards: 0.5313\n",
      "Iteration: 680, Train loss: -0.0182, rewards: 0.5642\n",
      "Iteration: 685, Train loss: -0.0253, rewards: 0.4836\n",
      "Iteration: 690, Train loss: -0.0177, rewards: 0.5552\n",
      "Iteration: 695, Train loss: -0.0146, rewards: 0.5582\n",
      "Iteration: 700, Train loss: -0.0177, rewards: 0.5164\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -0.0139, rewards: 0.5672\n",
      "Iteration: 710, Train loss: -0.0238, rewards: 0.4836\n",
      "Iteration: 715, Train loss: -0.0214, rewards: 0.5075\n",
      "Iteration: 720, Train loss: -0.0192, rewards: 0.5522\n",
      "Iteration: 725, Train loss: -0.0250, rewards: 0.5373\n",
      "Iteration: 730, Train loss: -0.0181, rewards: 0.5463\n",
      "Iteration: 735, Train loss: -0.0242, rewards: 0.5582\n",
      "Iteration: 740, Train loss: -0.0230, rewards: 0.5343\n",
      "Iteration: 745, Train loss: -0.0173, rewards: 0.5343\n",
      "Iteration: 750, Train loss: -0.0209, rewards: 0.5910\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.0229, rewards: 0.5552\n",
      "Iteration: 760, Train loss: -0.0156, rewards: 0.5373\n",
      "Iteration: 765, Train loss: -0.0173, rewards: 0.5493\n",
      "Iteration: 770, Train loss: -0.0222, rewards: 0.5164\n",
      "Iteration: 775, Train loss: -0.0183, rewards: 0.5433\n",
      "Iteration: 780, Train loss: -0.0192, rewards: 0.5015\n",
      "Iteration: 785, Train loss: -0.0149, rewards: 0.5612\n",
      "Iteration: 790, Train loss: -0.0155, rewards: 0.5284\n",
      "Iteration: 795, Train loss: -0.0189, rewards: 0.5493\n",
      "Iteration: 800, Train loss: -0.0195, rewards: 0.5582\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -0.0150, rewards: 0.5373\n",
      "Iteration: 810, Train loss: -0.0233, rewards: 0.5463\n",
      "Iteration: 815, Train loss: -0.0211, rewards: 0.5254\n",
      "Iteration: 820, Train loss: -0.0217, rewards: 0.5224\n",
      "Iteration: 825, Train loss: -0.0180, rewards: 0.4985\n",
      "Iteration: 830, Train loss: -0.0207, rewards: 0.5284\n",
      "Iteration: 835, Train loss: -0.0233, rewards: 0.5522\n",
      "Iteration: 840, Train loss: -0.0193, rewards: 0.5254\n",
      "Iteration: 845, Train loss: -0.0255, rewards: 0.5582\n",
      "Iteration: 850, Train loss: -0.0275, rewards: 0.5254\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -0.0247, rewards: 0.5552\n",
      "Iteration: 860, Train loss: -0.0257, rewards: 0.5164\n",
      "Iteration: 865, Train loss: -0.0156, rewards: 0.5642\n",
      "Iteration: 870, Train loss: -0.0180, rewards: 0.5373\n",
      "Iteration: 875, Train loss: -0.0210, rewards: 0.5493\n",
      "Iteration: 880, Train loss: -0.0198, rewards: 0.5134\n",
      "Iteration: 885, Train loss: -0.0241, rewards: 0.5552\n",
      "Iteration: 890, Train loss: -0.0209, rewards: 0.5313\n",
      "Iteration: 895, Train loss: -0.0220, rewards: 0.4985\n",
      "Iteration: 900, Train loss: -0.0233, rewards: 0.5373\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -0.0183, rewards: 0.5284\n",
      "Iteration: 910, Train loss: -0.0216, rewards: 0.5701\n",
      "Iteration: 915, Train loss: -0.0202, rewards: 0.4806\n",
      "Iteration: 920, Train loss: -0.0210, rewards: 0.5104\n",
      "Iteration: 925, Train loss: -0.0235, rewards: 0.5075\n",
      "Iteration: 930, Train loss: -0.0274, rewards: 0.5313\n",
      "Iteration: 935, Train loss: -0.0250, rewards: 0.5463\n",
      "Iteration: 940, Train loss: -0.0174, rewards: 0.5433\n",
      "Iteration: 945, Train loss: -0.0153, rewards: 0.5582\n",
      "Iteration: 950, Train loss: -0.0144, rewards: 0.5104\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -0.0150, rewards: 0.5313\n",
      "Iteration: 960, Train loss: -0.0183, rewards: 0.5552\n",
      "Iteration: 965, Train loss: -0.0183, rewards: 0.5701\n",
      "Iteration: 970, Train loss: -0.0158, rewards: 0.5134\n",
      "Iteration: 975, Train loss: -0.0198, rewards: 0.5582\n",
      "Iteration: 980, Train loss: -0.0289, rewards: 0.5373\n",
      "Iteration: 985, Train loss: -0.0144, rewards: 0.5493\n",
      "Iteration: 990, Train loss: -0.0246, rewards: 0.5373\n",
      "Iteration: 995, Train loss: -0.0142, rewards: 0.5134\n",
      "Iteration: 1000, Train loss: -0.0183, rewards: 0.4746\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -0.0170, rewards: 0.5552\n",
      "Iteration: 1010, Train loss: -0.0177, rewards: 0.5642\n",
      "Iteration: 1015, Train loss: -0.0188, rewards: 0.4896\n",
      "Iteration: 1020, Train loss: -0.0206, rewards: 0.4925\n",
      "Iteration: 1025, Train loss: -0.0166, rewards: 0.5672\n",
      "Iteration: 1030, Train loss: -0.0255, rewards: 0.5343\n",
      "Iteration: 1035, Train loss: -0.0193, rewards: 0.5045\n",
      "Iteration: 1040, Train loss: -0.0155, rewards: 0.5224\n",
      "Iteration: 1045, Train loss: -0.0220, rewards: 0.5075\n",
      "Iteration: 1050, Train loss: -0.0184, rewards: 0.5642\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -0.0155, rewards: 0.4985\n",
      "Iteration: 1060, Train loss: -0.0258, rewards: 0.5493\n",
      "Iteration: 1065, Train loss: -0.0172, rewards: 0.5552\n",
      "Iteration: 1070, Train loss: -0.0175, rewards: 0.5254\n",
      "Iteration: 1075, Train loss: -0.0245, rewards: 0.4776\n",
      "Iteration: 1080, Train loss: -0.0176, rewards: 0.5731\n",
      "Iteration: 1085, Train loss: -0.0195, rewards: 0.5463\n",
      "Iteration: 1090, Train loss: -0.0247, rewards: 0.4925\n",
      "Iteration: 1095, Train loss: -0.0218, rewards: 0.5284\n",
      "Iteration: 1100, Train loss: -0.0245, rewards: 0.5672\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.0292, rewards: 0.5672\n",
      "Iteration: 1110, Train loss: -0.0216, rewards: 0.5134\n",
      "Iteration: 1115, Train loss: -0.0270, rewards: 0.4836\n",
      "Iteration: 1120, Train loss: -0.0235, rewards: 0.5343\n",
      "Iteration: 1125, Train loss: -0.0211, rewards: 0.5582\n",
      "Iteration: 1130, Train loss: -0.0177, rewards: 0.5224\n",
      "Iteration: 1135, Train loss: -0.0137, rewards: 0.4896\n",
      "Iteration: 1140, Train loss: -0.0223, rewards: 0.5224\n",
      "Iteration: 1145, Train loss: -0.0221, rewards: 0.5701\n",
      "Iteration: 1150, Train loss: -0.0170, rewards: 0.5612\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -0.0177, rewards: 0.5493\n",
      "Iteration: 1160, Train loss: -0.0227, rewards: 0.5701\n",
      "Iteration: 1165, Train loss: -0.0195, rewards: 0.5224\n",
      "Iteration: 1170, Train loss: -0.0276, rewards: 0.5403\n",
      "Iteration: 1175, Train loss: -0.0206, rewards: 0.5522\n",
      "Iteration: 1180, Train loss: -0.0144, rewards: 0.5164\n",
      "Iteration: 1185, Train loss: -0.0225, rewards: 0.5075\n",
      "Iteration: 1190, Train loss: -0.0196, rewards: 0.5522\n",
      "Iteration: 1195, Train loss: -0.0213, rewards: 0.5791\n",
      "Iteration: 1200, Train loss: -0.0159, rewards: 0.5582\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -0.0190, rewards: 0.4687\n",
      "Iteration: 1210, Train loss: -0.0217, rewards: 0.5104\n",
      "Iteration: 1215, Train loss: -0.0230, rewards: 0.5015\n",
      "Iteration: 1220, Train loss: -0.0214, rewards: 0.5463\n",
      "Iteration: 1225, Train loss: -0.0162, rewards: 0.5582\n",
      "Iteration: 1230, Train loss: -0.0225, rewards: 0.5642\n",
      "Iteration: 1235, Train loss: -0.0229, rewards: 0.5373\n",
      "Iteration: 1240, Train loss: -0.0181, rewards: 0.5552\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -0.0268, rewards: 0.5045\n",
      "Iteration: 1250, Train loss: -0.0225, rewards: 0.5075\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -0.0195, rewards: 0.5134\n",
      "Iteration: 1260, Train loss: -0.0220, rewards: 0.5343\n",
      "Iteration: 1265, Train loss: -0.0240, rewards: 0.5134\n",
      "Iteration: 1270, Train loss: -0.0238, rewards: 0.5224\n",
      "Iteration: 1275, Train loss: -0.0152, rewards: 0.5075\n",
      "Iteration: 1280, Train loss: -0.0173, rewards: 0.4537\n",
      "Iteration: 1285, Train loss: -0.0181, rewards: 0.5672\n",
      "Iteration: 1290, Train loss: -0.0261, rewards: 0.5254\n",
      "Iteration: 1295, Train loss: -0.0264, rewards: 0.5552\n",
      "Iteration: 1300, Train loss: -0.0308, rewards: 0.5433\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -0.0194, rewards: 0.5015\n",
      "Iteration: 1310, Train loss: -0.0207, rewards: 0.5254\n",
      "Iteration: 1315, Train loss: -0.0239, rewards: 0.5194\n",
      "Iteration: 1320, Train loss: -0.0213, rewards: 0.5463\n",
      "Iteration: 1325, Train loss: -0.0238, rewards: 0.4955\n",
      "Iteration: 1330, Train loss: -0.0179, rewards: 0.5881\n",
      "Iteration: 1335, Train loss: -0.0164, rewards: 0.5254\n",
      "Iteration: 1340, Train loss: -0.0251, rewards: 0.5493\n",
      "Iteration: 1345, Train loss: -0.0206, rewards: 0.4925\n",
      "Iteration: 1350, Train loss: -0.0205, rewards: 0.5642\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -0.0286, rewards: 0.5701\n",
      "Iteration: 1360, Train loss: -0.0216, rewards: 0.5224\n",
      "Iteration: 1365, Train loss: -0.0206, rewards: 0.5403\n",
      "Iteration: 1370, Train loss: -0.0173, rewards: 0.5104\n",
      "Iteration: 1375, Train loss: -0.0199, rewards: 0.5493\n",
      "Iteration: 1380, Train loss: -0.0233, rewards: 0.5164\n",
      "Iteration: 1385, Train loss: -0.0211, rewards: 0.4985\n",
      "Iteration: 1390, Train loss: -0.0250, rewards: 0.4537\n",
      "Iteration: 1395, Train loss: -0.0258, rewards: 0.4866\n",
      "Iteration: 1400, Train loss: -0.0210, rewards: 0.5284\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -0.0299, rewards: 0.5313\n",
      "Iteration: 1410, Train loss: -0.0309, rewards: 0.4687\n",
      "Iteration: 1415, Train loss: -0.0171, rewards: 0.5493\n",
      "Iteration: 1420, Train loss: -0.0110, rewards: 0.5194\n",
      "Iteration: 1425, Train loss: -0.0204, rewards: 0.5104\n",
      "Iteration: 1430, Train loss: -0.0201, rewards: 0.5045\n",
      "Iteration: 1435, Train loss: -0.0214, rewards: 0.5791\n",
      "Iteration: 1440, Train loss: -0.0199, rewards: 0.4836\n",
      "Iteration: 1445, Train loss: -0.0245, rewards: 0.5284\n",
      "Iteration: 1450, Train loss: -0.0145, rewards: 0.5612\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -0.0176, rewards: 0.5284\n",
      "Iteration: 1460, Train loss: -0.0127, rewards: 0.5045\n",
      "Iteration: 1465, Train loss: -0.0183, rewards: 0.5642\n",
      "Iteration: 1470, Train loss: -0.0135, rewards: 0.5194\n",
      "Iteration: 1475, Train loss: -0.0143, rewards: 0.5313\n",
      "Iteration: 1480, Train loss: -0.0186, rewards: 0.5403\n",
      "Iteration: 1485, Train loss: -0.0263, rewards: 0.5373\n",
      "Iteration: 1490, Train loss: -0.0175, rewards: 0.5642\n",
      "Iteration: 1495, Train loss: -0.0188, rewards: 0.5552\n",
      "Iteration: 1500, Train loss: -0.0176, rewards: 0.5313\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -0.0269, rewards: 0.5284\n",
      "Iteration: 1510, Train loss: -0.0378, rewards: 0.5582\n",
      "Iteration: 1515, Train loss: -0.0213, rewards: 0.5313\n",
      "Iteration: 1520, Train loss: -0.0208, rewards: 0.5463\n",
      "Iteration: 1525, Train loss: -0.0179, rewards: 0.4955\n",
      "Iteration: 1530, Train loss: -0.0121, rewards: 0.5701\n",
      "Iteration: 1535, Train loss: -0.0178, rewards: 0.5104\n",
      "Iteration: 1540, Train loss: -0.0138, rewards: 0.4985\n",
      "Iteration: 1545, Train loss: -0.0246, rewards: 0.5224\n",
      "Iteration: 1550, Train loss: -0.0165, rewards: 0.5761\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.0178, rewards: 0.4836\n",
      "Iteration: 1560, Train loss: -0.0273, rewards: 0.5403\n",
      "Iteration: 1565, Train loss: -0.0113, rewards: 0.5313\n",
      "Iteration: 1570, Train loss: -0.0191, rewards: 0.5224\n",
      "Iteration: 1575, Train loss: -0.0255, rewards: 0.5045\n",
      "Iteration: 1580, Train loss: -0.0158, rewards: 0.5134\n",
      "Iteration: 1585, Train loss: -0.0183, rewards: 0.5612\n",
      "Iteration: 1590, Train loss: -0.0208, rewards: 0.5254\n",
      "Iteration: 1595, Train loss: -0.0248, rewards: 0.5343\n",
      "Iteration: 1600, Train loss: -0.0179, rewards: 0.5731\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.0199, rewards: 0.4985\n",
      "Iteration: 1610, Train loss: -0.0184, rewards: 0.5284\n",
      "Iteration: 1615, Train loss: -0.0145, rewards: 0.4985\n",
      "Iteration: 1620, Train loss: -0.0284, rewards: 0.5104\n",
      "Iteration: 1625, Train loss: -0.0265, rewards: 0.5612\n",
      "Iteration: 1630, Train loss: -0.0194, rewards: 0.5403\n",
      "Iteration: 1635, Train loss: -0.0129, rewards: 0.6000\n",
      "Iteration: 1640, Train loss: -0.0232, rewards: 0.5582\n",
      "Iteration: 1645, Train loss: -0.0299, rewards: 0.5403\n",
      "Iteration: 1650, Train loss: -0.0120, rewards: 0.5612\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -0.0184, rewards: 0.5194\n",
      "Iteration: 1660, Train loss: -0.0195, rewards: 0.5582\n",
      "Iteration: 1665, Train loss: -0.0144, rewards: 0.4716\n",
      "Iteration: 1670, Train loss: -0.0205, rewards: 0.5522\n",
      "Iteration: 1675, Train loss: -0.0229, rewards: 0.5642\n",
      "Iteration: 1680, Train loss: -0.0175, rewards: 0.5194\n",
      "Iteration: 1685, Train loss: -0.0179, rewards: 0.5672\n",
      "Iteration: 1690, Train loss: -0.0235, rewards: 0.5134\n",
      "Iteration: 1695, Train loss: -0.0247, rewards: 0.5224\n",
      "Iteration: 1700, Train loss: -0.0187, rewards: 0.5403\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -0.0188, rewards: 0.5343\n",
      "Iteration: 1710, Train loss: -0.0145, rewards: 0.4896\n",
      "Iteration: 1715, Train loss: -0.0160, rewards: 0.5522\n",
      "Iteration: 1720, Train loss: -0.0252, rewards: 0.5254\n",
      "Iteration: 1725, Train loss: -0.0268, rewards: 0.5373\n",
      "Iteration: 1730, Train loss: -0.0181, rewards: 0.5433\n",
      "Iteration: 1735, Train loss: -0.0134, rewards: 0.4627\n",
      "Iteration: 1740, Train loss: -0.0198, rewards: 0.5731\n",
      "Iteration: 1745, Train loss: -0.0184, rewards: 0.5612\n",
      "Iteration: 1750, Train loss: -0.0169, rewards: 0.5134\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.0210, rewards: 0.5731\n",
      "Iteration: 1760, Train loss: -0.0137, rewards: 0.5463\n",
      "Iteration: 1765, Train loss: -0.0186, rewards: 0.5552\n",
      "Iteration: 1770, Train loss: -0.0173, rewards: 0.5373\n",
      "Iteration: 1775, Train loss: -0.0158, rewards: 0.5164\n",
      "Iteration: 1780, Train loss: -0.0167, rewards: 0.5701\n",
      "Iteration: 1785, Train loss: -0.0189, rewards: 0.5642\n",
      "Iteration: 1790, Train loss: -0.0276, rewards: 0.5373\n",
      "Iteration: 1795, Train loss: -0.0132, rewards: 0.5403\n",
      "Iteration: 1800, Train loss: -0.0197, rewards: 0.5463\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5212\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -0.0171, rewards: 0.4776\n",
      "Iteration: 1810, Train loss: -0.0233, rewards: 0.5493\n",
      "Iteration: 1815, Train loss: -0.0257, rewards: 0.5522\n",
      "Iteration: 1820, Train loss: -0.0231, rewards: 0.5254\n",
      "Iteration: 1825, Train loss: -0.0182, rewards: 0.5433\n",
      "Iteration: 1830, Train loss: -0.0178, rewards: 0.4955\n",
      "Iteration: 1835, Train loss: -0.0167, rewards: 0.5612\n",
      "Iteration: 1840, Train loss: -0.0188, rewards: 0.5821\n",
      "Iteration: 1845, Train loss: -0.0286, rewards: 0.5403\n",
      "Iteration: 1850, Train loss: -0.0193, rewards: 0.4836\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -0.0182, rewards: 0.4955\n",
      "Iteration: 1860, Train loss: -0.0241, rewards: 0.5045\n",
      "Iteration: 1865, Train loss: -0.0189, rewards: 0.5075\n",
      "Iteration: 1870, Train loss: -0.0160, rewards: 0.5582\n",
      "Iteration: 1875, Train loss: -0.0231, rewards: 0.4955\n",
      "Iteration: 1880, Train loss: -0.0170, rewards: 0.5791\n",
      "Iteration: 1885, Train loss: -0.0188, rewards: 0.5403\n",
      "Iteration: 1890, Train loss: -0.0241, rewards: 0.5373\n",
      "Iteration: 1895, Train loss: -0.0212, rewards: 0.5164\n",
      "Iteration: 1900, Train loss: -0.0202, rewards: 0.4925\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -0.0235, rewards: 0.5284\n",
      "Iteration: 1910, Train loss: -0.0219, rewards: 0.5433\n",
      "Iteration: 1915, Train loss: -0.0217, rewards: 0.5373\n",
      "Iteration: 1920, Train loss: -0.0135, rewards: 0.5164\n",
      "Iteration: 1925, Train loss: -0.0215, rewards: 0.5403\n",
      "Iteration: 1930, Train loss: -0.0243, rewards: 0.5075\n",
      "Iteration: 1935, Train loss: -0.0239, rewards: 0.5851\n",
      "Iteration: 1940, Train loss: -0.0190, rewards: 0.5075\n",
      "Iteration: 1945, Train loss: -0.0228, rewards: 0.5194\n",
      "Iteration: 1950, Train loss: -0.0223, rewards: 0.5134\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -0.0174, rewards: 0.5851\n",
      "Iteration: 1960, Train loss: -0.0189, rewards: 0.5164\n",
      "Iteration: 1965, Train loss: -0.0197, rewards: 0.5403\n",
      "Iteration: 1970, Train loss: -0.0162, rewards: 0.5134\n",
      "Iteration: 1975, Train loss: -0.0134, rewards: 0.5582\n",
      "Iteration: 1980, Train loss: -0.0134, rewards: 0.5104\n",
      "Iteration: 1985, Train loss: -0.0196, rewards: 0.5313\n",
      "Iteration: 1990, Train loss: -0.0201, rewards: 0.5194\n",
      "Iteration: 1995, Train loss: -0.0247, rewards: 0.5075\n",
      "Iteration: 2000, Train loss: -0.0226, rewards: 0.5075\n",
      "Eval:\n",
      "Hits@1: 0.5106, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5213\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personborninlocation//test_beam/ ]\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0466, MRR: 0.0193\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.37672393812290184 (193 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:57:51,222]\u001b[0m Trial 0 finished with value: 0.37672393812290184 and parameters: {'lr': 0.0098624645019596, 'bs': 67, 'b': 0.11269754444615498, 'l': 0.46014476820721034, 'ee': 50}. Best is trial 0 with value: 0.37672393812290184.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: 0.0010, rewards: 0.5402\n",
      "Iteration: 20, Train loss: -0.0004, rewards: 0.3780\n",
      "Iteration: 30, Train loss: -0.0006, rewards: 0.3310\n",
      "Iteration: 40, Train loss: -0.0001, rewards: 0.3760\n",
      "Iteration: 50, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 60, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 70, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 80, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 90, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 100, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0266, MRR: 0.0289\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 120, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 130, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 140, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 150, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 160, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 170, Train loss: -0.0000, rewards: 0.0020\n",
      "Iteration: 180, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 190, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 200, Train loss: -0.0002, rewards: 0.1270\n",
      "Eval:\n",
      "Hits@1: 0.4521, Hits@3: 0.4840, Hits@10: 0.5266, MRR: 0.4758\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.0000, rewards: 0.0510\n",
      "Iteration: 220, Train loss: 0.0033, rewards: 0.2444\n",
      "Iteration: 230, Train loss: -0.0018, rewards: 0.5350\n",
      "Iteration: 240, Train loss: -0.0005, rewards: 0.5130\n",
      "Iteration: 250, Train loss: -0.0003, rewards: 0.5450\n",
      "Iteration: 260, Train loss: -0.0007, rewards: 0.5180\n",
      "Iteration: 270, Train loss: -0.0002, rewards: 0.5460\n",
      "Iteration: 280, Train loss: -0.0014, rewards: 0.5370\n",
      "Iteration: 290, Train loss: -0.0027, rewards: 0.5424\n",
      "Iteration: 300, Train loss: -0.0004, rewards: 0.5370\n",
      "Eval:\n",
      "Hits@1: 0.5266, Hits@3: 0.5266, Hits@10: 0.5372, MRR: 0.5292\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.0000, rewards: 0.5510\n",
      "Iteration: 320, Train loss: -0.0002, rewards: 0.5460\n",
      "Iteration: 330, Train loss: -0.0002, rewards: 0.5350\n",
      "Iteration: 340, Train loss: -0.0008, rewards: 0.5510\n",
      "Iteration: 350, Train loss: -0.0009, rewards: 0.5700\n",
      "Iteration: 360, Train loss: -0.0007, rewards: 0.5530\n",
      "Iteration: 370, Train loss: -0.0039, rewards: 0.5290\n",
      "Iteration: 380, Train loss: -0.0017, rewards: 0.5680\n",
      "Iteration: 390, Train loss: -0.0032, rewards: 0.5760\n",
      "Iteration: 400, Train loss: -0.0019, rewards: 0.5860\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5268\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.0020, rewards: 0.5485\n",
      "Iteration: 420, Train loss: -0.0047, rewards: 0.5500\n",
      "Iteration: 430, Train loss: -0.0025, rewards: 0.5520\n",
      "Iteration: 440, Train loss: -0.0019, rewards: 0.5850\n",
      "Iteration: 450, Train loss: -0.0027, rewards: 0.5570\n",
      "Iteration: 460, Train loss: -0.0025, rewards: 0.5420\n",
      "Iteration: 470, Train loss: -0.0027, rewards: 0.5420\n",
      "Iteration: 480, Train loss: -0.0027, rewards: 0.5980\n",
      "Iteration: 490, Train loss: -0.0018, rewards: 0.5530\n",
      "Iteration: 500, Train loss: -0.0056, rewards: 0.5570\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5293\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.0056, rewards: 0.5490\n",
      "Iteration: 520, Train loss: -0.0041, rewards: 0.5740\n",
      "Iteration: 530, Train loss: -0.0032, rewards: 0.5420\n",
      "Iteration: 540, Train loss: -0.0024, rewards: 0.5450\n",
      "Iteration: 550, Train loss: -0.0036, rewards: 0.5290\n",
      "Iteration: 560, Train loss: -0.0036, rewards: 0.5570\n",
      "Iteration: 570, Train loss: -0.0047, rewards: 0.5510\n",
      "Iteration: 580, Train loss: -0.0046, rewards: 0.5380\n",
      "Iteration: 590, Train loss: -0.0038, rewards: 0.5440\n",
      "Iteration: 600, Train loss: -0.0056, rewards: 0.5590\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5293\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.0047, rewards: 0.5480\n",
      "Iteration: 620, Train loss: -0.0070, rewards: 0.5670\n",
      "Iteration: 630, Train loss: -0.0033, rewards: 0.5430\n",
      "Iteration: 640, Train loss: -0.0083, rewards: 0.5380\n",
      "Iteration: 650, Train loss: -0.0054, rewards: 0.5830\n",
      "Iteration: 660, Train loss: -0.0066, rewards: 0.5350\n",
      "Iteration: 670, Train loss: -0.0081, rewards: 0.5620\n",
      "Iteration: 680, Train loss: -0.0123, rewards: 0.5590\n",
      "Iteration: 690, Train loss: -0.0049, rewards: 0.5580\n",
      "Iteration: 700, Train loss: -0.0033, rewards: 0.5630\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5290\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.0044, rewards: 0.5730\n",
      "Iteration: 720, Train loss: -0.0030, rewards: 0.5490\n",
      "Iteration: 730, Train loss: -0.0049, rewards: 0.5590\n",
      "Iteration: 740, Train loss: -0.0059, rewards: 0.5190\n",
      "Iteration: 750, Train loss: -0.0071, rewards: 0.5430\n",
      "Iteration: 760, Train loss: -0.0115, rewards: 0.5380\n",
      "Iteration: 770, Train loss: -0.0142, rewards: 0.5410\n",
      "Iteration: 780, Train loss: -0.0114, rewards: 0.5510\n",
      "Iteration: 790, Train loss: -0.0099, rewards: 0.5570\n",
      "Iteration: 800, Train loss: -0.0121, rewards: 0.5550\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5288\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -0.0125, rewards: 0.5600\n",
      "Iteration: 820, Train loss: -0.0096, rewards: 0.5410\n",
      "Iteration: 830, Train loss: -0.0087, rewards: 0.5470\n",
      "Iteration: 840, Train loss: -0.0085, rewards: 0.5580\n",
      "Iteration: 850, Train loss: -0.0120, rewards: 0.5200\n",
      "Iteration: 860, Train loss: -0.0093, rewards: 0.5630\n",
      "Iteration: 870, Train loss: -0.0088, rewards: 0.5640\n",
      "Iteration: 880, Train loss: -0.0096, rewards: 0.5560\n",
      "Iteration: 890, Train loss: -0.0083, rewards: 0.5550\n",
      "Iteration: 900, Train loss: -0.0090, rewards: 0.5430\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5291\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.0116, rewards: 0.5370\n",
      "Iteration: 920, Train loss: -0.0077, rewards: 0.5510\n",
      "Iteration: 930, Train loss: -0.0108, rewards: 0.5560\n",
      "Iteration: 940, Train loss: -0.0094, rewards: 0.5440\n",
      "Iteration: 950, Train loss: -0.0097, rewards: 0.5380\n",
      "Iteration: 960, Train loss: -0.0134, rewards: 0.5440\n",
      "Iteration: 970, Train loss: -0.0123, rewards: 0.5570\n",
      "Iteration: 980, Train loss: -0.0181, rewards: 0.5380\n",
      "Iteration: 990, Train loss: -0.0155, rewards: 0.5370\n",
      "Iteration: 1000, Train loss: -0.0107, rewards: 0.5480\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5291\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.0117, rewards: 0.5590\n",
      "Iteration: 1020, Train loss: -0.0102, rewards: 0.5230\n",
      "Iteration: 1030, Train loss: -0.0112, rewards: 0.5410\n",
      "Iteration: 1040, Train loss: -0.0107, rewards: 0.5520\n",
      "Iteration: 1050, Train loss: -0.0136, rewards: 0.5300\n",
      "Iteration: 1060, Train loss: -0.0114, rewards: 0.5530\n",
      "Iteration: 1070, Train loss: -0.0107, rewards: 0.5610\n",
      "Iteration: 1080, Train loss: -0.0183, rewards: 0.5610\n",
      "Iteration: 1090, Train loss: -0.0249, rewards: 0.5680\n",
      "Iteration: 1100, Train loss: -0.0174, rewards: 0.5500\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5291\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.0151, rewards: 0.5290\n",
      "Iteration: 1120, Train loss: -0.0136, rewards: 0.5550\n",
      "Iteration: 1130, Train loss: -0.0116, rewards: 0.5700\n",
      "Iteration: 1140, Train loss: -0.0110, rewards: 0.5500\n",
      "Iteration: 1150, Train loss: -0.0126, rewards: 0.5290\n",
      "Iteration: 1160, Train loss: -0.0141, rewards: 0.5620\n",
      "Iteration: 1170, Train loss: -0.0165, rewards: 0.5570\n",
      "Iteration: 1180, Train loss: -0.0211, rewards: 0.5510\n",
      "Iteration: 1190, Train loss: -0.0257, rewards: 0.5670\n",
      "Iteration: 1200, Train loss: -0.0182, rewards: 0.5490\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5290\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.0254, rewards: 0.5250\n",
      "Iteration: 1220, Train loss: -0.0169, rewards: 0.5320\n",
      "Iteration: 1230, Train loss: -0.0151, rewards: 0.5850\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.0121, rewards: 0.5440\n",
      "Iteration: 1250, Train loss: -0.0099, rewards: 0.5250\n",
      "Iteration: 1260, Train loss: -0.0118, rewards: 0.5520\n",
      "Iteration: 1270, Train loss: -0.0110, rewards: 0.5460\n",
      "Iteration: 1280, Train loss: -0.0111, rewards: 0.5440\n",
      "Iteration: 1290, Train loss: -0.0113, rewards: 0.5610\n",
      "Iteration: 1300, Train loss: -0.0126, rewards: 0.5410\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5426, MRR: 0.5292\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.0110, rewards: 0.5540\n",
      "Iteration: 1320, Train loss: -0.0100, rewards: 0.5430\n",
      "Iteration: 1330, Train loss: -0.0119, rewards: 0.5580\n",
      "Iteration: 1340, Train loss: -0.0158, rewards: 0.5190\n",
      "Iteration: 1350, Train loss: -0.0126, rewards: 0.5510\n",
      "Iteration: 1360, Train loss: -0.0133, rewards: 0.5091\n",
      "Iteration: 1370, Train loss: -0.0084, rewards: 0.5360\n",
      "Iteration: 1380, Train loss: -0.0128, rewards: 0.5360\n",
      "Iteration: 1390, Train loss: -0.0139, rewards: 0.5740\n",
      "Iteration: 1400, Train loss: -0.0141, rewards: 0.5610\n",
      "Eval:\n",
      "Hits@1: 0.5213, Hits@3: 0.5319, Hits@10: 0.5372, MRR: 0.5284\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.0135, rewards: 0.5370\n",
      "Iteration: 1420, Train loss: -0.0175, rewards: 0.5410\n",
      "Iteration: 1430, Train loss: -0.0150, rewards: 0.5570\n",
      "Iteration: 1440, Train loss: -0.0219, rewards: 0.5390\n",
      "Iteration: 1450, Train loss: -0.0158, rewards: 0.5520\n",
      "Iteration: 1460, Train loss: -0.0147, rewards: 0.5350\n",
      "Iteration: 1470, Train loss: -0.0118, rewards: 0.5530\n",
      "Iteration: 1480, Train loss: -0.0164, rewards: 0.5720\n",
      "Iteration: 1490, Train loss: -0.0129, rewards: 0.5510\n",
      "Iteration: 1500, Train loss: -0.0123, rewards: 0.5520\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5213, Hits@10: 0.5372, MRR: 0.5221\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.0109, rewards: 0.5120\n",
      "Iteration: 1520, Train loss: -0.0067, rewards: 0.5270\n",
      "Iteration: 1530, Train loss: -0.0094, rewards: 0.5340\n",
      "Iteration: 1540, Train loss: -0.0105, rewards: 0.5420\n",
      "Iteration: 1550, Train loss: -0.0119, rewards: 0.5500\n",
      "Iteration: 1560, Train loss: -0.0101, rewards: 0.5030\n",
      "Iteration: 1570, Train loss: -0.0076, rewards: 0.5481\n",
      "Iteration: 1580, Train loss: -0.0077, rewards: 0.5380\n",
      "Iteration: 1590, Train loss: -0.0136, rewards: 0.5690\n",
      "Iteration: 1600, Train loss: -0.0093, rewards: 0.5350\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5244\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.0076, rewards: 0.5540\n",
      "Iteration: 1620, Train loss: -0.0097, rewards: 0.5390\n",
      "Iteration: 1630, Train loss: -0.0042, rewards: 0.5580\n",
      "Iteration: 1640, Train loss: -0.0080, rewards: 0.5220\n",
      "Iteration: 1650, Train loss: -0.0078, rewards: 0.5180\n",
      "Iteration: 1660, Train loss: -0.0047, rewards: 0.5220\n",
      "Iteration: 1670, Train loss: -0.0091, rewards: 0.5390\n",
      "Iteration: 1680, Train loss: -0.0085, rewards: 0.5360\n",
      "Iteration: 1690, Train loss: -0.0107, rewards: 0.5370\n",
      "Iteration: 1700, Train loss: -0.0157, rewards: 0.5390\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5244\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -0.0133, rewards: 0.5370\n",
      "Iteration: 1720, Train loss: -0.0127, rewards: 0.5390\n",
      "Iteration: 1730, Train loss: -0.0149, rewards: 0.5190\n",
      "Iteration: 1740, Train loss: -0.0114, rewards: 0.5420\n",
      "Iteration: 1750, Train loss: -0.0105, rewards: 0.5160\n",
      "Iteration: 1760, Train loss: -0.0123, rewards: 0.5250\n",
      "Iteration: 1770, Train loss: -0.0134, rewards: 0.5540\n",
      "Iteration: 1780, Train loss: -0.0139, rewards: 0.5270\n",
      "Iteration: 1790, Train loss: -0.0141, rewards: 0.5480\n",
      "Iteration: 1800, Train loss: -0.0172, rewards: 0.5420\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5266, Hits@10: 0.5426, MRR: 0.5245\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.0106, rewards: 0.5070\n",
      "Iteration: 1820, Train loss: -0.0111, rewards: 0.5280\n",
      "Iteration: 1830, Train loss: -0.0134, rewards: 0.5350\n",
      "Iteration: 1840, Train loss: -0.0105, rewards: 0.5240\n",
      "Iteration: 1850, Train loss: -0.0110, rewards: 0.5430\n",
      "Iteration: 1860, Train loss: -0.0120, rewards: 0.5580\n",
      "Iteration: 1870, Train loss: -0.0151, rewards: 0.5320\n",
      "Iteration: 1880, Train loss: -0.0106, rewards: 0.5390\n",
      "Iteration: 1890, Train loss: -0.0165, rewards: 0.5040\n",
      "Iteration: 1900, Train loss: -0.0110, rewards: 0.5170\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5266, Hits@10: 0.5372, MRR: 0.5243\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -0.0139, rewards: 0.5320\n",
      "Iteration: 1920, Train loss: -0.0119, rewards: 0.5300\n",
      "Iteration: 1930, Train loss: -0.0110, rewards: 0.5400\n",
      "Iteration: 1940, Train loss: -0.0143, rewards: 0.5280\n",
      "Iteration: 1950, Train loss: -0.0140, rewards: 0.5320\n",
      "Iteration: 1960, Train loss: -0.0159, rewards: 0.5200\n",
      "Iteration: 1970, Train loss: -0.0137, rewards: 0.5370\n",
      "Iteration: 1980, Train loss: -0.0137, rewards: 0.5390\n",
      "Iteration: 1990, Train loss: -0.0160, rewards: 0.5080\n",
      "Iteration: 2000, Train loss: -0.0108, rewards: 0.5450\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5266, Hits@10: 0.5372, MRR: 0.5243\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personborninlocation//test_beam/ ]\n",
      "Hits@1: 0.5130, Hits@3: 0.5544, Hits@10: 0.6114, MRR: 0.5416\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.765713388511316 (193 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 22:50:26,415]\u001b[0m Trial 1 finished with value: 0.765713388511316 and parameters: {'lr': 0.0044829794404304185, 'bs': 100, 'b': 0.005082138740448772, 'l': 0.14497033499140466, 'ee': 100}. Best is trial 1 with value: 0.765713388511316.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.1387, rewards: 0.5184\n",
      "Iteration: 10, Train loss: 0.0661, rewards: 0.5190\n",
      "Iteration: 15, Train loss: 0.0581, rewards: 0.5363\n",
      "Iteration: 20, Train loss: 0.0530, rewards: 0.5533\n",
      "Iteration: 25, Train loss: 0.0129, rewards: 0.5650\n",
      "Iteration: 30, Train loss: 0.0143, rewards: 0.5457\n",
      "Iteration: 35, Train loss: -0.0093, rewards: 0.5909\n",
      "Iteration: 40, Train loss: 0.0694, rewards: 0.5870\n",
      "Iteration: 45, Train loss: 0.0135, rewards: 0.5540\n",
      "Iteration: 50, Train loss: 0.0290, rewards: 0.5920\n",
      "Eval:\n",
      "Hits@1: 0.5532, Hits@3: 0.5532, Hits@10: 0.5532, MRR: 0.5532\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: 0.0844, rewards: 0.5887\n",
      "Iteration: 60, Train loss: 0.0680, rewards: 0.5385\n",
      "Iteration: 65, Train loss: 0.0064, rewards: 0.5459\n",
      "Iteration: 70, Train loss: 0.0814, rewards: 0.5984\n",
      "Iteration: 75, Train loss: 0.0945, rewards: 0.5875\n",
      "Iteration: 80, Train loss: 0.0988, rewards: 0.5563\n",
      "Iteration: 85, Train loss: 0.0312, rewards: 0.5936\n",
      "Iteration: 90, Train loss: 0.0631, rewards: 0.5932\n",
      "Iteration: 95, Train loss: 0.1102, rewards: 0.6025\n",
      "Iteration: 100, Train loss: 0.0703, rewards: 0.6163\n",
      "Eval:\n",
      "Hits@1: 0.5585, Hits@3: 0.5745, Hits@10: 0.5798, MRR: 0.5652\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: 0.0094, rewards: 0.5803\n",
      "Iteration: 110, Train loss: 0.0516, rewards: 0.5753\n",
      "Iteration: 115, Train loss: 0.0741, rewards: 0.5675\n",
      "Iteration: 120, Train loss: 0.0873, rewards: 0.5771\n",
      "Iteration: 125, Train loss: 0.0711, rewards: 0.5829\n",
      "Iteration: 130, Train loss: 0.0550, rewards: 0.5709\n",
      "Iteration: 135, Train loss: 0.0237, rewards: 0.6372\n",
      "Iteration: 140, Train loss: 0.0475, rewards: 0.5970\n",
      "Iteration: 145, Train loss: 0.0956, rewards: 0.6067\n",
      "Iteration: 150, Train loss: 0.0257, rewards: 0.6078\n",
      "Eval:\n",
      "Hits@1: 0.5585, Hits@3: 0.5957, Hits@10: 0.6064, MRR: 0.5757\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: 0.0250, rewards: 0.6076\n",
      "Iteration: 160, Train loss: 0.0360, rewards: 0.5918\n",
      "Iteration: 165, Train loss: 0.0466, rewards: 0.5670\n",
      "Iteration: 170, Train loss: 0.0631, rewards: 0.6033\n",
      "Iteration: 175, Train loss: 0.0650, rewards: 0.5621\n",
      "Iteration: 180, Train loss: 0.0663, rewards: 0.5953\n",
      "Iteration: 185, Train loss: 0.0601, rewards: 0.5775\n",
      "Iteration: 190, Train loss: 0.0253, rewards: 0.5989\n",
      "Iteration: 195, Train loss: 0.0390, rewards: 0.5977\n",
      "Iteration: 200, Train loss: 0.0903, rewards: 0.6063\n",
      "Eval:\n",
      "Hits@1: 0.5638, Hits@3: 0.5851, Hits@10: 0.5851, MRR: 0.5736\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: 0.1068, rewards: 0.6116\n",
      "Iteration: 210, Train loss: 0.0729, rewards: 0.6321\n",
      "Iteration: 215, Train loss: 0.0783, rewards: 0.6112\n",
      "Iteration: 220, Train loss: 0.0855, rewards: 0.5811\n",
      "Iteration: 225, Train loss: 0.0535, rewards: 0.6065\n",
      "Iteration: 230, Train loss: 0.0551, rewards: 0.6082\n",
      "Iteration: 235, Train loss: 0.0972, rewards: 0.6277\n",
      "Iteration: 240, Train loss: 0.0702, rewards: 0.6024\n",
      "Iteration: 245, Train loss: 0.0038, rewards: 0.6076\n",
      "Iteration: 250, Train loss: 0.0731, rewards: 0.5937\n",
      "Eval:\n",
      "Hits@1: 0.5691, Hits@3: 0.5745, Hits@10: 0.5798, MRR: 0.5731\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: 0.0650, rewards: 0.6050\n",
      "Iteration: 260, Train loss: 0.0800, rewards: 0.6321\n",
      "Iteration: 265, Train loss: 0.0373, rewards: 0.5915\n",
      "Iteration: 270, Train loss: 0.0784, rewards: 0.6432\n",
      "Iteration: 275, Train loss: 0.0405, rewards: 0.6179\n",
      "Iteration: 280, Train loss: 0.0454, rewards: 0.5683\n",
      "Iteration: 285, Train loss: 0.0065, rewards: 0.5960\n",
      "Iteration: 290, Train loss: -0.0249, rewards: 0.6444\n",
      "Iteration: 295, Train loss: 0.0291, rewards: 0.6158\n",
      "Iteration: 300, Train loss: 0.0504, rewards: 0.6131\n",
      "Eval:\n",
      "Hits@1: 0.5585, Hits@3: 0.5745, Hits@10: 0.5851, MRR: 0.5683\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: 0.0624, rewards: 0.5927\n",
      "Iteration: 310, Train loss: 0.0525, rewards: 0.6360\n",
      "Iteration: 315, Train loss: 0.0906, rewards: 0.6107\n",
      "Iteration: 320, Train loss: 0.0490, rewards: 0.6493\n",
      "Iteration: 325, Train loss: 0.0779, rewards: 0.6193\n",
      "Iteration: 330, Train loss: 0.0655, rewards: 0.6328\n",
      "Iteration: 335, Train loss: 0.0612, rewards: 0.6274\n",
      "Iteration: 340, Train loss: 0.0217, rewards: 0.6254\n",
      "Iteration: 345, Train loss: 0.0293, rewards: 0.6216\n",
      "Iteration: 350, Train loss: 0.0129, rewards: 0.6314\n",
      "Eval:\n",
      "Hits@1: 0.5638, Hits@3: 0.6011, Hits@10: 0.6064, MRR: 0.5833\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: 0.0482, rewards: 0.6447\n",
      "Iteration: 360, Train loss: 0.0427, rewards: 0.6264\n",
      "Iteration: 365, Train loss: 0.0454, rewards: 0.6390\n",
      "Iteration: 370, Train loss: 0.0593, rewards: 0.6237\n",
      "Iteration: 375, Train loss: 0.0499, rewards: 0.6056\n",
      "Iteration: 380, Train loss: 0.0559, rewards: 0.6161\n",
      "Iteration: 385, Train loss: 0.0058, rewards: 0.6160\n",
      "Iteration: 390, Train loss: 0.0638, rewards: 0.6424\n",
      "Iteration: 395, Train loss: 0.0649, rewards: 0.6064\n",
      "Iteration: 400, Train loss: 0.0101, rewards: 0.6595\n",
      "Eval:\n",
      "Hits@1: 0.5691, Hits@3: 0.6277, Hits@10: 0.6436, MRR: 0.5996\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: 0.0752, rewards: 0.5700\n",
      "Iteration: 410, Train loss: 0.0515, rewards: 0.5885\n",
      "Iteration: 415, Train loss: 0.0454, rewards: 0.6242\n",
      "Iteration: 420, Train loss: 0.0295, rewards: 0.6266\n",
      "Iteration: 425, Train loss: 0.0936, rewards: 0.6015\n",
      "Iteration: 430, Train loss: 0.0726, rewards: 0.6562\n",
      "Iteration: 435, Train loss: 0.0642, rewards: 0.6133\n",
      "Iteration: 440, Train loss: 0.1000, rewards: 0.6329\n",
      "Iteration: 445, Train loss: 0.0620, rewards: 0.6084\n",
      "Iteration: 450, Train loss: 0.0156, rewards: 0.6250\n",
      "Eval:\n",
      "Hits@1: 0.5745, Hits@3: 0.6064, Hits@10: 0.6064, MRR: 0.5887\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: 0.1305, rewards: 0.6228\n",
      "Iteration: 460, Train loss: 0.0973, rewards: 0.6041\n",
      "Iteration: 465, Train loss: 0.0268, rewards: 0.5780\n",
      "Iteration: 470, Train loss: 0.0695, rewards: 0.6205\n",
      "Iteration: 475, Train loss: 0.0522, rewards: 0.5991\n",
      "Iteration: 480, Train loss: 0.0615, rewards: 0.5932\n",
      "Iteration: 485, Train loss: 0.0535, rewards: 0.5974\n",
      "Iteration: 490, Train loss: 0.0685, rewards: 0.6147\n",
      "Iteration: 495, Train loss: 0.0834, rewards: 0.6585\n",
      "Iteration: 500, Train loss: 0.0166, rewards: 0.5691\n",
      "Eval:\n",
      "Hits@1: 0.5745, Hits@3: 0.5798, Hits@10: 0.5851, MRR: 0.5785\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: 0.0817, rewards: 0.6361\n",
      "Iteration: 510, Train loss: 0.0275, rewards: 0.6254\n",
      "Iteration: 515, Train loss: 0.0006, rewards: 0.6195\n",
      "Iteration: 520, Train loss: 0.0625, rewards: 0.6294\n",
      "Iteration: 525, Train loss: 0.1150, rewards: 0.6155\n",
      "Iteration: 530, Train loss: 0.0671, rewards: 0.6740\n",
      "Iteration: 535, Train loss: 0.0422, rewards: 0.6631\n",
      "Iteration: 540, Train loss: 0.1305, rewards: 0.6212\n",
      "Iteration: 545, Train loss: 0.1255, rewards: 0.6239\n",
      "Iteration: 550, Train loss: 0.0867, rewards: 0.6477\n",
      "Eval:\n",
      "Hits@1: 0.5904, Hits@3: 0.6223, Hits@10: 0.6277, MRR: 0.6071\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: 0.0940, rewards: 0.6231\n",
      "Iteration: 560, Train loss: 0.0539, rewards: 0.6325\n",
      "Iteration: 565, Train loss: 0.1161, rewards: 0.6372\n",
      "Iteration: 570, Train loss: 0.0769, rewards: 0.6454\n",
      "Iteration: 575, Train loss: 0.0861, rewards: 0.6560\n",
      "Iteration: 580, Train loss: 0.0452, rewards: 0.6465\n",
      "Iteration: 585, Train loss: 0.1024, rewards: 0.6340\n",
      "Iteration: 590, Train loss: 0.1036, rewards: 0.6266\n",
      "Iteration: 595, Train loss: 0.0657, rewards: 0.6414\n",
      "Iteration: 600, Train loss: 0.0925, rewards: 0.6329\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6277, Hits@10: 0.6277, MRR: 0.6117\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: 0.1212, rewards: 0.6242\n",
      "Iteration: 610, Train loss: 0.0662, rewards: 0.6367\n",
      "Iteration: 615, Train loss: 0.0882, rewards: 0.6573\n",
      "Iteration: 620, Train loss: 0.0945, rewards: 0.6308\n",
      "Iteration: 625, Train loss: 0.0507, rewards: 0.6436\n",
      "Iteration: 630, Train loss: 0.0710, rewards: 0.6530\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 635, Train loss: 0.0641, rewards: 0.6643\n",
      "Iteration: 640, Train loss: 0.0760, rewards: 0.6232\n",
      "Iteration: 645, Train loss: 0.0690, rewards: 0.6346\n",
      "Iteration: 650, Train loss: 0.0891, rewards: 0.6409\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6277, Hits@10: 0.6383, MRR: 0.6144\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: 0.0916, rewards: 0.6589\n",
      "Iteration: 660, Train loss: 0.0783, rewards: 0.6540\n",
      "Iteration: 665, Train loss: 0.0585, rewards: 0.6343\n",
      "Iteration: 670, Train loss: 0.0832, rewards: 0.6767\n",
      "Iteration: 675, Train loss: 0.0976, rewards: 0.6454\n",
      "Iteration: 680, Train loss: 0.0604, rewards: 0.6390\n",
      "Iteration: 685, Train loss: 0.1044, rewards: 0.6524\n",
      "Iteration: 690, Train loss: 0.0517, rewards: 0.6244\n",
      "Iteration: 695, Train loss: 0.0749, rewards: 0.6396\n",
      "Iteration: 700, Train loss: 0.0808, rewards: 0.6783\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6277, Hits@10: 0.6330, MRR: 0.6142\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: 0.0699, rewards: 0.6702\n",
      "Iteration: 710, Train loss: 0.0550, rewards: 0.6451\n",
      "Iteration: 715, Train loss: 0.0999, rewards: 0.6271\n",
      "Iteration: 720, Train loss: 0.0583, rewards: 0.6085\n",
      "Iteration: 725, Train loss: 0.0610, rewards: 0.6675\n",
      "Iteration: 730, Train loss: -0.0142, rewards: 0.6020\n",
      "Iteration: 735, Train loss: -0.0039, rewards: 0.6800\n",
      "Iteration: 740, Train loss: 0.0143, rewards: 0.6353\n",
      "Iteration: 745, Train loss: -0.0038, rewards: 0.6420\n",
      "Iteration: 750, Train loss: 0.0235, rewards: 0.6766\n",
      "Eval:\n",
      "Hits@1: 0.5904, Hits@3: 0.6223, Hits@10: 0.6277, MRR: 0.6051\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: 0.0050, rewards: 0.6259\n",
      "Iteration: 760, Train loss: -0.0392, rewards: 0.6349\n",
      "Iteration: 765, Train loss: 0.0011, rewards: 0.6184\n",
      "Iteration: 770, Train loss: 0.0110, rewards: 0.6260\n",
      "Iteration: 775, Train loss: 0.0579, rewards: 0.6483\n",
      "Iteration: 780, Train loss: -0.0018, rewards: 0.6529\n",
      "Iteration: 785, Train loss: 0.0056, rewards: 0.6797\n",
      "Iteration: 790, Train loss: -0.0311, rewards: 0.6359\n",
      "Iteration: 795, Train loss: 0.0206, rewards: 0.6372\n",
      "Iteration: 800, Train loss: -0.0208, rewards: 0.6548\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6330, Hits@10: 0.6436, MRR: 0.6174\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -0.0241, rewards: 0.6251\n",
      "Iteration: 810, Train loss: 0.0164, rewards: 0.6492\n",
      "Iteration: 815, Train loss: -0.0167, rewards: 0.6753\n",
      "Iteration: 820, Train loss: 0.0354, rewards: 0.6642\n",
      "Iteration: 825, Train loss: 0.0154, rewards: 0.6537\n",
      "Iteration: 830, Train loss: 0.0006, rewards: 0.6967\n",
      "Iteration: 835, Train loss: 0.0474, rewards: 0.6424\n",
      "Iteration: 840, Train loss: 0.0752, rewards: 0.6722\n",
      "Iteration: 845, Train loss: 0.0274, rewards: 0.6296\n",
      "Iteration: 850, Train loss: -0.0093, rewards: 0.6346\n",
      "Eval:\n",
      "Hits@1: 0.5957, Hits@3: 0.6383, Hits@10: 0.6489, MRR: 0.6142\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -0.0021, rewards: 0.6591\n",
      "Iteration: 860, Train loss: 0.0192, rewards: 0.6314\n",
      "Iteration: 865, Train loss: 0.0220, rewards: 0.6754\n",
      "Iteration: 870, Train loss: 0.0361, rewards: 0.6798\n",
      "Iteration: 875, Train loss: 0.0145, rewards: 0.6400\n",
      "Iteration: 880, Train loss: 0.0353, rewards: 0.6458\n",
      "Iteration: 885, Train loss: 0.0249, rewards: 0.6133\n",
      "Iteration: 890, Train loss: -0.0241, rewards: 0.7002\n",
      "Iteration: 895, Train loss: 0.0194, rewards: 0.6503\n",
      "Iteration: 900, Train loss: 0.1041, rewards: 0.6688\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6330, Hits@10: 0.6383, MRR: 0.6154\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -0.0016, rewards: 0.6811\n",
      "Iteration: 910, Train loss: 0.0205, rewards: 0.6514\n",
      "Iteration: 915, Train loss: -0.0118, rewards: 0.6733\n",
      "Iteration: 920, Train loss: -0.0345, rewards: 0.6436\n",
      "Iteration: 925, Train loss: -0.0220, rewards: 0.6631\n",
      "Iteration: 930, Train loss: -0.0193, rewards: 0.6647\n",
      "Iteration: 935, Train loss: 0.0020, rewards: 0.6321\n",
      "Iteration: 940, Train loss: 0.0323, rewards: 0.6331\n",
      "Iteration: 945, Train loss: 0.0483, rewards: 0.6619\n",
      "Iteration: 950, Train loss: 0.0583, rewards: 0.6675\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6277, Hits@10: 0.6330, MRR: 0.6141\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: 0.0679, rewards: 0.6508\n",
      "Iteration: 960, Train loss: 0.0069, rewards: 0.6519\n",
      "Iteration: 965, Train loss: -0.0002, rewards: 0.6569\n",
      "Iteration: 970, Train loss: 0.0023, rewards: 0.6191\n",
      "Iteration: 975, Train loss: 0.0148, rewards: 0.6229\n",
      "Iteration: 980, Train loss: -0.0191, rewards: 0.6461\n",
      "Iteration: 985, Train loss: -0.0237, rewards: 0.6689\n",
      "Iteration: 990, Train loss: 0.0450, rewards: 0.6680\n",
      "Iteration: 995, Train loss: 0.0006, rewards: 0.6636\n",
      "Iteration: 1000, Train loss: 0.0761, rewards: 0.6744\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6277, Hits@10: 0.6330, MRR: 0.6210\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: 0.0115, rewards: 0.6214\n",
      "Iteration: 1010, Train loss: -0.0534, rewards: 0.6684\n",
      "Iteration: 1015, Train loss: -0.0540, rewards: 0.6775\n",
      "Iteration: 1020, Train loss: 0.0065, rewards: 0.6687\n",
      "Iteration: 1025, Train loss: 0.0044, rewards: 0.6173\n",
      "Iteration: 1030, Train loss: -0.0340, rewards: 0.6542\n",
      "Iteration: 1035, Train loss: -0.0180, rewards: 0.6590\n",
      "Iteration: 1040, Train loss: 0.0197, rewards: 0.6106\n",
      "Iteration: 1045, Train loss: 0.0438, rewards: 0.6416\n",
      "Iteration: 1050, Train loss: 0.0172, rewards: 0.6589\n",
      "Eval:\n",
      "Hits@1: 0.5957, Hits@3: 0.6383, Hits@10: 0.6436, MRR: 0.6154\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: 0.0530, rewards: 0.6693\n",
      "Iteration: 1060, Train loss: 0.0379, rewards: 0.6446\n",
      "Iteration: 1065, Train loss: -0.0017, rewards: 0.6590\n",
      "Iteration: 1070, Train loss: -0.0195, rewards: 0.6739\n",
      "Iteration: 1075, Train loss: -0.0278, rewards: 0.6404\n",
      "Iteration: 1080, Train loss: -0.0148, rewards: 0.6872\n",
      "Iteration: 1085, Train loss: 0.0032, rewards: 0.6633\n",
      "Iteration: 1090, Train loss: -0.0072, rewards: 0.6651\n",
      "Iteration: 1095, Train loss: 0.0572, rewards: 0.6664\n",
      "Iteration: 1100, Train loss: 0.0136, rewards: 0.6509\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6383, Hits@10: 0.6436, MRR: 0.6212\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: 0.0346, rewards: 0.6859\n",
      "Iteration: 1110, Train loss: -0.0626, rewards: 0.6455\n",
      "Iteration: 1115, Train loss: 0.0146, rewards: 0.6510\n",
      "Iteration: 1120, Train loss: -0.0158, rewards: 0.6624\n",
      "Iteration: 1125, Train loss: 0.0397, rewards: 0.6676\n",
      "Iteration: 1130, Train loss: -0.0137, rewards: 0.6587\n",
      "Iteration: 1135, Train loss: 0.0560, rewards: 0.6626\n",
      "Iteration: 1140, Train loss: 0.0236, rewards: 0.6733\n",
      "Iteration: 1145, Train loss: 0.0318, rewards: 0.6674\n",
      "Iteration: 1150, Train loss: -0.0132, rewards: 0.6910\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6436, Hits@10: 0.6489, MRR: 0.6258\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: 0.0257, rewards: 0.6597\n",
      "Iteration: 1160, Train loss: -0.0137, rewards: 0.6701\n",
      "Iteration: 1165, Train loss: -0.0240, rewards: 0.6781\n",
      "Iteration: 1170, Train loss: -0.0253, rewards: 0.6534\n",
      "Iteration: 1175, Train loss: -0.0116, rewards: 0.6420\n",
      "Iteration: 1180, Train loss: 0.0225, rewards: 0.7002\n",
      "Iteration: 1185, Train loss: 0.0695, rewards: 0.6839\n",
      "Iteration: 1190, Train loss: -0.0183, rewards: 0.6717\n",
      "Iteration: 1195, Train loss: -0.0642, rewards: 0.6397\n",
      "Iteration: 1200, Train loss: -0.0186, rewards: 0.6728\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6330, Hits@10: 0.6489, MRR: 0.6229\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -0.0317, rewards: 0.6313\n",
      "Iteration: 1210, Train loss: 0.0223, rewards: 0.6645\n",
      "Iteration: 1215, Train loss: -0.0002, rewards: 0.6597\n",
      "Iteration: 1220, Train loss: -0.0018, rewards: 0.6512\n",
      "Iteration: 1225, Train loss: 0.0299, rewards: 0.6628\n",
      "Iteration: 1230, Train loss: -0.0335, rewards: 0.6572\n",
      "Iteration: 1235, Train loss: 0.0379, rewards: 0.6853\n",
      "Iteration: 1240, Train loss: 0.0083, rewards: 0.6492\n",
      "Iteration: 1245, Train loss: -0.0739, rewards: 0.6507\n",
      "Iteration: 1250, Train loss: -0.0122, rewards: 0.6790\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6277, Hits@10: 0.6436, MRR: 0.6237\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1255, Train loss: 0.0203, rewards: 0.6713\n",
      "Iteration: 1260, Train loss: -0.0515, rewards: 0.6724\n",
      "Iteration: 1265, Train loss: -0.0585, rewards: 0.6690\n",
      "Iteration: 1270, Train loss: -0.0073, rewards: 0.6633\n",
      "Iteration: 1275, Train loss: -0.0312, rewards: 0.6761\n",
      "Iteration: 1280, Train loss: -0.0429, rewards: 0.6866\n",
      "Iteration: 1285, Train loss: 0.0217, rewards: 0.6737\n",
      "Iteration: 1290, Train loss: 0.0146, rewards: 0.6569\n",
      "Iteration: 1295, Train loss: -0.0628, rewards: 0.6595\n",
      "Iteration: 1300, Train loss: -0.0684, rewards: 0.6798\n",
      "Eval:\n",
      "Hits@1: 0.6170, Hits@3: 0.6436, Hits@10: 0.6543, MRR: 0.6292\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -0.0229, rewards: 0.6889\n",
      "Iteration: 1310, Train loss: -0.0309, rewards: 0.6759\n",
      "Iteration: 1315, Train loss: -0.0471, rewards: 0.6879\n",
      "Iteration: 1320, Train loss: -0.0473, rewards: 0.6546\n",
      "Iteration: 1325, Train loss: 0.0033, rewards: 0.6663\n",
      "Iteration: 1330, Train loss: -0.0079, rewards: 0.6675\n",
      "Iteration: 1335, Train loss: -0.0090, rewards: 0.7123\n",
      "Iteration: 1340, Train loss: -0.0102, rewards: 0.6680\n",
      "Iteration: 1345, Train loss: -0.0229, rewards: 0.6612\n",
      "Iteration: 1350, Train loss: -0.0316, rewards: 0.6476\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6383, Hits@10: 0.6543, MRR: 0.6290\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -0.0370, rewards: 0.6555\n",
      "Iteration: 1360, Train loss: -0.0006, rewards: 0.6843\n",
      "Iteration: 1365, Train loss: -0.0100, rewards: 0.6450\n",
      "Iteration: 1370, Train loss: -0.0228, rewards: 0.6735\n",
      "Iteration: 1375, Train loss: -0.0589, rewards: 0.6563\n",
      "Iteration: 1380, Train loss: -0.0223, rewards: 0.6639\n",
      "Iteration: 1385, Train loss: -0.0385, rewards: 0.6604\n",
      "Iteration: 1390, Train loss: -0.0215, rewards: 0.6759\n",
      "Iteration: 1395, Train loss: -0.0528, rewards: 0.6755\n",
      "Iteration: 1400, Train loss: -0.0277, rewards: 0.6737\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6436, Hits@10: 0.6436, MRR: 0.6259\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -0.0061, rewards: 0.7045\n",
      "Iteration: 1410, Train loss: -0.0168, rewards: 0.7107\n",
      "Iteration: 1415, Train loss: -0.0260, rewards: 0.6751\n",
      "Iteration: 1420, Train loss: -0.0349, rewards: 0.6928\n",
      "Iteration: 1425, Train loss: 0.0058, rewards: 0.6953\n",
      "Iteration: 1430, Train loss: -0.0512, rewards: 0.6943\n",
      "Iteration: 1435, Train loss: -0.0320, rewards: 0.6673\n",
      "Iteration: 1440, Train loss: -0.0201, rewards: 0.6911\n",
      "Iteration: 1445, Train loss: 0.0219, rewards: 0.6859\n",
      "Iteration: 1450, Train loss: 0.0332, rewards: 0.6772\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6383, Hits@10: 0.6543, MRR: 0.6250\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -0.0431, rewards: 0.6543\n",
      "Iteration: 1460, Train loss: -0.0259, rewards: 0.6976\n",
      "Iteration: 1465, Train loss: -0.0554, rewards: 0.6663\n",
      "Iteration: 1470, Train loss: -0.0218, rewards: 0.6711\n",
      "Iteration: 1475, Train loss: 0.0308, rewards: 0.6760\n",
      "Iteration: 1480, Train loss: 0.0276, rewards: 0.6223\n",
      "Iteration: 1485, Train loss: -0.0554, rewards: 0.6787\n",
      "Iteration: 1490, Train loss: -0.0051, rewards: 0.6467\n",
      "Iteration: 1495, Train loss: -0.0693, rewards: 0.6700\n",
      "Iteration: 1500, Train loss: 0.0126, rewards: 0.6624\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6489, Hits@10: 0.6543, MRR: 0.6296\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -0.0645, rewards: 0.6551\n",
      "Iteration: 1510, Train loss: -0.0074, rewards: 0.6621\n",
      "Iteration: 1515, Train loss: -0.0398, rewards: 0.6478\n",
      "Iteration: 1520, Train loss: -0.0106, rewards: 0.6554\n",
      "Iteration: 1525, Train loss: -0.0831, rewards: 0.6902\n",
      "Iteration: 1530, Train loss: -0.0526, rewards: 0.6782\n",
      "Iteration: 1535, Train loss: -0.0430, rewards: 0.6928\n",
      "Iteration: 1540, Train loss: -0.0154, rewards: 0.6616\n",
      "Iteration: 1545, Train loss: -0.0027, rewards: 0.6809\n",
      "Iteration: 1550, Train loss: 0.0391, rewards: 0.7012\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6489, Hits@10: 0.6489, MRR: 0.6277\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.0300, rewards: 0.6367\n",
      "Iteration: 1560, Train loss: 0.0167, rewards: 0.6737\n",
      "Iteration: 1565, Train loss: -0.0300, rewards: 0.6979\n",
      "Iteration: 1570, Train loss: -0.0833, rewards: 0.6600\n",
      "Iteration: 1575, Train loss: -0.0379, rewards: 0.6500\n",
      "Iteration: 1580, Train loss: -0.0698, rewards: 0.6680\n",
      "Iteration: 1585, Train loss: -0.0561, rewards: 0.6653\n",
      "Iteration: 1590, Train loss: -0.0487, rewards: 0.7224\n",
      "Iteration: 1595, Train loss: 0.0226, rewards: 0.6799\n",
      "Iteration: 1600, Train loss: -0.0088, rewards: 0.6820\n",
      "Eval:\n",
      "Hits@1: 0.6117, Hits@3: 0.6436, Hits@10: 0.6436, MRR: 0.6259\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.0162, rewards: 0.6759\n",
      "Iteration: 1610, Train loss: -0.0111, rewards: 0.6725\n",
      "Iteration: 1615, Train loss: 0.0039, rewards: 0.6647\n",
      "Iteration: 1620, Train loss: 0.0330, rewards: 0.6662\n",
      "Iteration: 1625, Train loss: 0.0047, rewards: 0.6677\n",
      "Iteration: 1630, Train loss: -0.0203, rewards: 0.6728\n",
      "Iteration: 1635, Train loss: -0.0213, rewards: 0.6450\n",
      "Iteration: 1640, Train loss: -0.0542, rewards: 0.6598\n",
      "Iteration: 1645, Train loss: -0.0134, rewards: 0.6596\n",
      "Iteration: 1650, Train loss: -0.0260, rewards: 0.6750\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6383, Hits@10: 0.6543, MRR: 0.6240\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -0.0538, rewards: 0.6626\n",
      "Iteration: 1660, Train loss: -0.0199, rewards: 0.6307\n",
      "Iteration: 1665, Train loss: 0.0232, rewards: 0.6811\n",
      "Iteration: 1670, Train loss: -0.0207, rewards: 0.6880\n",
      "Iteration: 1675, Train loss: -0.0030, rewards: 0.6841\n",
      "Iteration: 1680, Train loss: 0.0051, rewards: 0.6537\n",
      "Iteration: 1685, Train loss: -0.0637, rewards: 0.6682\n",
      "Iteration: 1690, Train loss: -0.0505, rewards: 0.6407\n",
      "Iteration: 1695, Train loss: -0.0219, rewards: 0.6703\n",
      "Iteration: 1700, Train loss: -0.0651, rewards: 0.6838\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6436, Hits@10: 0.6489, MRR: 0.6241\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -0.0014, rewards: 0.6645\n",
      "Iteration: 1710, Train loss: -0.0240, rewards: 0.6862\n",
      "Iteration: 1715, Train loss: 0.0132, rewards: 0.6676\n",
      "Iteration: 1720, Train loss: -0.0415, rewards: 0.6592\n",
      "Iteration: 1725, Train loss: 0.0045, rewards: 0.6996\n",
      "Iteration: 1730, Train loss: -0.0609, rewards: 0.6643\n",
      "Iteration: 1735, Train loss: -0.0663, rewards: 0.6684\n",
      "Iteration: 1740, Train loss: -0.0026, rewards: 0.6737\n",
      "Iteration: 1745, Train loss: -0.0434, rewards: 0.6949\n",
      "Iteration: 1750, Train loss: -0.0061, rewards: 0.6983\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6330, Hits@10: 0.6436, MRR: 0.6169\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.0187, rewards: 0.6596\n",
      "Iteration: 1760, Train loss: -0.1042, rewards: 0.6536\n",
      "Iteration: 1765, Train loss: -0.0733, rewards: 0.6722\n",
      "Iteration: 1770, Train loss: 0.0222, rewards: 0.6768\n",
      "Iteration: 1775, Train loss: -0.0265, rewards: 0.6623\n",
      "Iteration: 1780, Train loss: -0.0048, rewards: 0.6709\n",
      "Iteration: 1785, Train loss: -0.0236, rewards: 0.6690\n",
      "Iteration: 1790, Train loss: 0.0261, rewards: 0.6609\n",
      "Iteration: 1795, Train loss: -0.0276, rewards: 0.6750\n",
      "Iteration: 1800, Train loss: -0.0001, rewards: 0.6655\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6383, Hits@10: 0.6436, MRR: 0.6221\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -0.0255, rewards: 0.6433\n",
      "Iteration: 1810, Train loss: -0.0793, rewards: 0.6907\n",
      "Iteration: 1815, Train loss: -0.0539, rewards: 0.6961\n",
      "Iteration: 1820, Train loss: -0.0287, rewards: 0.6619\n",
      "Iteration: 1825, Train loss: 0.0266, rewards: 0.6908\n",
      "Iteration: 1830, Train loss: -0.0162, rewards: 0.6694\n",
      "Iteration: 1835, Train loss: -0.0449, rewards: 0.6485\n",
      "Iteration: 1840, Train loss: -0.0117, rewards: 0.7002\n",
      "Iteration: 1845, Train loss: 0.0031, rewards: 0.6793\n",
      "Iteration: 1850, Train loss: 0.0305, rewards: 0.6668\n",
      "Eval:\n",
      "Hits@1: 0.6064, Hits@3: 0.6277, Hits@10: 0.6489, MRR: 0.6216\n",
      "------------------------------------------------------------\n",
      "Iteration: 1855, Train loss: 0.0688, rewards: 0.6889\n",
      "Iteration: 1860, Train loss: 0.0182, rewards: 0.6894\n",
      "Iteration: 1865, Train loss: 0.0297, rewards: 0.6381\n",
      "Iteration: 1870, Train loss: 0.0005, rewards: 0.6620\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1875, Train loss: 0.0774, rewards: 0.6903\n",
      "Iteration: 1880, Train loss: -0.0182, rewards: 0.6604\n",
      "Iteration: 1885, Train loss: -0.0149, rewards: 0.7059\n",
      "Iteration: 1890, Train loss: -0.0325, rewards: 0.6598\n",
      "Iteration: 1895, Train loss: 0.0635, rewards: 0.6575\n",
      "Iteration: 1900, Train loss: 0.0400, rewards: 0.6808\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6330, Hits@10: 0.6383, MRR: 0.6170\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: 0.0248, rewards: 0.6789\n",
      "Iteration: 1910, Train loss: -0.0328, rewards: 0.6620\n",
      "Iteration: 1915, Train loss: 0.0007, rewards: 0.6841\n",
      "Iteration: 1920, Train loss: 0.0032, rewards: 0.6814\n",
      "Iteration: 1925, Train loss: 0.0169, rewards: 0.6463\n",
      "Iteration: 1930, Train loss: -0.0185, rewards: 0.6766\n",
      "Iteration: 1935, Train loss: -0.0642, rewards: 0.6828\n",
      "Iteration: 1940, Train loss: -0.0273, rewards: 0.6955\n",
      "Iteration: 1945, Train loss: -0.0203, rewards: 0.6785\n",
      "Iteration: 1950, Train loss: -0.0766, rewards: 0.6628\n",
      "Eval:\n",
      "Hits@1: 0.6011, Hits@3: 0.6330, Hits@10: 0.6436, MRR: 0.6191\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -0.0210, rewards: 0.6732\n",
      "Iteration: 1960, Train loss: -0.0446, rewards: 0.6879\n",
      "Iteration: 1965, Train loss: 0.0046, rewards: 0.6344\n",
      "Iteration: 1970, Train loss: -0.0285, rewards: 0.6707\n",
      "Iteration: 1975, Train loss: -0.0043, rewards: 0.6919\n",
      "Iteration: 1980, Train loss: -0.0025, rewards: 0.6693\n",
      "Iteration: 1985, Train loss: -0.0286, rewards: 0.6508\n",
      "Iteration: 1990, Train loss: 0.0321, rewards: 0.6842\n",
      "Iteration: 1995, Train loss: -0.0520, rewards: 0.6573\n",
      "Iteration: 2000, Train loss: -0.0220, rewards: 0.6746\n",
      "Eval:\n",
      "Hits@1: 0.6170, Hits@3: 0.6383, Hits@10: 0.6489, MRR: 0.6273\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personborninlocation//test_beam/ ]\n",
      "Hits@1: 0.4611, Hits@3: 0.7306, Hits@10: 0.8031, MRR: 0.6058\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.7545280712379158 (193 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 23:54:08,578]\u001b[0m Trial 2 finished with value: 0.7545280712379158 and parameters: {'lr': 0.0031517989645742533, 'bs': 123, 'b': 0.09730259545934583, 'l': 0.26792311723383533, 'ee': 50}. Best is trial 1 with value: 0.765713388511316.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.7652, rewards: 0.3115\n",
      "Iteration: 20, Train loss: -0.9073, rewards: 0.4142\n",
      "Iteration: 30, Train loss: -0.8289, rewards: 0.3920\n",
      "Iteration: 40, Train loss: -0.8347, rewards: 0.4053\n",
      "Iteration: 50, Train loss: -0.9590, rewards: 0.4592\n",
      "Iteration: 60, Train loss: -0.9604, rewards: 0.4572\n",
      "Iteration: 70, Train loss: -0.8885, rewards: 0.4070\n",
      "Iteration: 80, Train loss: -0.9352, rewards: 0.4875\n",
      "Iteration: 90, Train loss: -0.9184, rewards: 0.4442\n",
      "Iteration: 100, Train loss: -0.8844, rewards: 0.3708\n",
      "Eval:\n",
      "Hits@1: 0.5319, Hits@3: 0.5372, Hits@10: 0.5585, MRR: 0.5390\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.9110, rewards: 0.4132\n",
      "Iteration: 120, Train loss: -0.9786, rewards: 0.4512\n",
      "Iteration: 130, Train loss: -0.9469, rewards: 0.4730\n",
      "Iteration: 140, Train loss: -0.8958, rewards: 0.4502\n",
      "Iteration: 150, Train loss: -0.9441, rewards: 0.4398\n",
      "Iteration: 160, Train loss: -0.8531, rewards: 0.4693\n",
      "Iteration: 170, Train loss: -0.7777, rewards: 0.4493\n",
      "Iteration: 180, Train loss: -0.9394, rewards: 0.4917\n",
      "Iteration: 190, Train loss: -0.8932, rewards: 0.4522\n",
      "Iteration: 200, Train loss: -0.9583, rewards: 0.4308\n",
      "Eval:\n",
      "Hits@1: 0.5426, Hits@3: 0.5532, Hits@10: 0.5585, MRR: 0.5480\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -1.0392, rewards: 0.4222\n",
      "Iteration: 220, Train loss: -0.9551, rewards: 0.4642\n",
      "Iteration: 230, Train loss: -0.8568, rewards: 0.4955\n",
      "Iteration: 240, Train loss: -0.8832, rewards: 0.4670\n",
      "Iteration: 250, Train loss: -0.9580, rewards: 0.4007\n",
      "Iteration: 260, Train loss: -0.9283, rewards: 0.4832\n",
      "Iteration: 270, Train loss: -0.9343, rewards: 0.4712\n",
      "Iteration: 280, Train loss: -0.9124, rewards: 0.3955\n",
      "Iteration: 290, Train loss: -0.7873, rewards: 0.4658\n",
      "Iteration: 300, Train loss: -0.9464, rewards: 0.4988\n",
      "Eval:\n",
      "Hits@1: 0.5426, Hits@3: 0.5532, Hits@10: 0.5585, MRR: 0.5490\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.9106, rewards: 0.4175\n",
      "Iteration: 320, Train loss: -0.9163, rewards: 0.4415\n",
      "Iteration: 330, Train loss: -0.9816, rewards: 0.4150\n",
      "Iteration: 340, Train loss: -0.8900, rewards: 0.4730\n",
      "Iteration: 350, Train loss: -0.9248, rewards: 0.4597\n",
      "Iteration: 360, Train loss: -0.9918, rewards: 0.4592\n",
      "Iteration: 370, Train loss: -0.9516, rewards: 0.4795\n",
      "Iteration: 380, Train loss: -0.9950, rewards: 0.4125\n",
      "Iteration: 390, Train loss: -0.9792, rewards: 0.4445\n",
      "Iteration: 400, Train loss: -0.8751, rewards: 0.4508\n",
      "Eval:\n",
      "Hits@1: 0.5426, Hits@3: 0.5638, Hits@10: 0.5798, MRR: 0.5531\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.8569, rewards: 0.5063\n",
      "Iteration: 420, Train loss: -1.0144, rewards: 0.4700\n",
      "Iteration: 430, Train loss: -0.9121, rewards: 0.4778\n",
      "Iteration: 440, Train loss: -0.9190, rewards: 0.4737\n",
      "Iteration: 450, Train loss: -0.8554, rewards: 0.4137\n",
      "Iteration: 460, Train loss: -0.8173, rewards: 0.5257\n",
      "Iteration: 470, Train loss: -0.8703, rewards: 0.4897\n",
      "Iteration: 480, Train loss: -0.9298, rewards: 0.4782\n",
      "Iteration: 490, Train loss: -0.8020, rewards: 0.4298\n",
      "Iteration: 500, Train loss: -0.8983, rewards: 0.4653\n",
      "Eval:\n",
      "Hits@1: 0.5426, Hits@3: 0.5532, Hits@10: 0.5691, MRR: 0.5499\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.9462, rewards: 0.4375\n",
      "Iteration: 520, Train loss: -0.9277, rewards: 0.4583\n",
      "Iteration: 530, Train loss: -0.8747, rewards: 0.4420\n",
      "Iteration: 540, Train loss: -0.9943, rewards: 0.4593\n",
      "Iteration: 550, Train loss: -0.8792, rewards: 0.5010\n",
      "Iteration: 560, Train loss: -1.0263, rewards: 0.4703\n",
      "Iteration: 570, Train loss: -0.9753, rewards: 0.4648\n",
      "Iteration: 580, Train loss: -0.8970, rewards: 0.4750\n",
      "Iteration: 590, Train loss: -0.9229, rewards: 0.5122\n",
      "Iteration: 600, Train loss: -0.9702, rewards: 0.4422\n",
      "Eval:\n",
      "Hits@1: 0.5372, Hits@3: 0.5532, Hits@10: 0.5638, MRR: 0.5465\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -1.0401, rewards: 0.4267\n",
      "Iteration: 620, Train loss: -0.9861, rewards: 0.5107\n",
      "Iteration: 630, Train loss: -0.9585, rewards: 0.4558\n",
      "Iteration: 640, Train loss: -0.9900, rewards: 0.4448\n",
      "Iteration: 650, Train loss: -0.9965, rewards: 0.4593\n",
      "Iteration: 660, Train loss: -0.9749, rewards: 0.4515\n",
      "Iteration: 670, Train loss: -0.9467, rewards: 0.4797\n",
      "Iteration: 680, Train loss: -0.9832, rewards: 0.5018\n",
      "Iteration: 690, Train loss: -0.9862, rewards: 0.4947\n",
      "Iteration: 700, Train loss: -0.9510, rewards: 0.4535\n",
      "Eval:\n",
      "Hits@1: 0.5532, Hits@3: 0.5691, Hits@10: 0.5691, MRR: 0.5599\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.9168, rewards: 0.4327\n",
      "Iteration: 720, Train loss: -0.9685, rewards: 0.4238\n",
      "Iteration: 730, Train loss: -0.9023, rewards: 0.4670\n",
      "Iteration: 740, Train loss: -0.8741, rewards: 0.4720\n",
      "Iteration: 750, Train loss: -0.9154, rewards: 0.5425\n",
      "Iteration: 760, Train loss: -1.0221, rewards: 0.4832\n",
      "Iteration: 770, Train loss: -1.0584, rewards: 0.4920\n",
      "Iteration: 780, Train loss: -0.9541, rewards: 0.4590\n",
      "Iteration: 790, Train loss: -0.8002, rewards: 0.4557\n",
      "Iteration: 800, Train loss: -0.9075, rewards: 0.4613\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5585, Hits@10: 0.5638, MRR: 0.5523\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -0.9137, rewards: 0.4800\n",
      "Iteration: 820, Train loss: -0.8797, rewards: 0.5002\n",
      "Iteration: 830, Train loss: -0.8682, rewards: 0.4688\n",
      "Iteration: 840, Train loss: -0.9691, rewards: 0.4630\n",
      "Iteration: 850, Train loss: -0.9846, rewards: 0.4700\n",
      "Iteration: 860, Train loss: -0.9031, rewards: 0.4813\n",
      "Iteration: 870, Train loss: -0.9301, rewards: 0.3953\n",
      "Iteration: 880, Train loss: -0.8613, rewards: 0.4707\n",
      "Iteration: 890, Train loss: -0.9931, rewards: 0.4625\n",
      "Iteration: 900, Train loss: -0.9272, rewards: 0.5080\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5585, Hits@10: 0.5638, MRR: 0.5532\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.9462, rewards: 0.4600\n",
      "Iteration: 920, Train loss: -0.8461, rewards: 0.5090\n",
      "Iteration: 930, Train loss: -1.0581, rewards: 0.4403\n",
      "Iteration: 940, Train loss: -1.0311, rewards: 0.4465\n",
      "Iteration: 950, Train loss: -0.9423, rewards: 0.4663\n",
      "Iteration: 960, Train loss: -1.0125, rewards: 0.4855\n",
      "Iteration: 970, Train loss: -0.8615, rewards: 0.4380\n",
      "Iteration: 980, Train loss: -0.9683, rewards: 0.4418\n",
      "Iteration: 990, Train loss: -0.9162, rewards: 0.4775\n",
      "Iteration: 1000, Train loss: -0.9117, rewards: 0.5147\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5691, Hits@10: 0.5851, MRR: 0.5587\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.8861, rewards: 0.4547\n",
      "Iteration: 1020, Train loss: -0.9240, rewards: 0.4948\n",
      "Iteration: 1030, Train loss: -0.9140, rewards: 0.4908\n",
      "Iteration: 1040, Train loss: -0.9060, rewards: 0.4802\n",
      "Iteration: 1050, Train loss: -0.9553, rewards: 0.4687\n",
      "Iteration: 1060, Train loss: -0.9979, rewards: 0.4497\n",
      "Iteration: 1070, Train loss: -0.8948, rewards: 0.5388\n",
      "Iteration: 1080, Train loss: -0.9725, rewards: 0.4653\n",
      "Iteration: 1090, Train loss: -0.9626, rewards: 0.4957\n",
      "Iteration: 1100, Train loss: -1.0067, rewards: 0.5083\n",
      "Eval:\n",
      "Hits@1: 0.5532, Hits@3: 0.5638, Hits@10: 0.5691, MRR: 0.5576\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.9722, rewards: 0.4832\n",
      "Iteration: 1120, Train loss: -0.9595, rewards: 0.5182\n",
      "Iteration: 1130, Train loss: -1.0044, rewards: 0.5053\n",
      "Iteration: 1140, Train loss: -0.9000, rewards: 0.4645\n",
      "Iteration: 1150, Train loss: -1.0349, rewards: 0.4998\n",
      "Iteration: 1160, Train loss: -0.8528, rewards: 0.4965\n",
      "Iteration: 1170, Train loss: -1.0009, rewards: 0.4303\n",
      "Iteration: 1180, Train loss: -0.9040, rewards: 0.5078\n",
      "Iteration: 1190, Train loss: -0.8834, rewards: 0.4788\n",
      "Iteration: 1200, Train loss: -0.9331, rewards: 0.4753\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5691, Hits@10: 0.5798, MRR: 0.5592\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.9005, rewards: 0.4468\n",
      "Iteration: 1220, Train loss: -0.8630, rewards: 0.5120\n",
      "Iteration: 1230, Train loss: -0.8975, rewards: 0.4933\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.8729, rewards: 0.4728\n",
      "Iteration: 1250, Train loss: -0.8320, rewards: 0.4980\n",
      "Iteration: 1260, Train loss: -1.0321, rewards: 0.4702\n",
      "Iteration: 1270, Train loss: -0.9300, rewards: 0.4780\n",
      "Iteration: 1280, Train loss: -1.0128, rewards: 0.4677\n",
      "Iteration: 1290, Train loss: -0.8463, rewards: 0.4973\n",
      "Iteration: 1300, Train loss: -1.0519, rewards: 0.4045\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5638, Hits@10: 0.5798, MRR: 0.5577\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.9566, rewards: 0.4968\n",
      "Iteration: 1320, Train loss: -0.9419, rewards: 0.4462\n",
      "Iteration: 1330, Train loss: -0.8721, rewards: 0.5043\n",
      "Iteration: 1340, Train loss: -0.9323, rewards: 0.4582\n",
      "Iteration: 1350, Train loss: -1.0249, rewards: 0.5443\n",
      "Iteration: 1360, Train loss: -1.0415, rewards: 0.4875\n",
      "Iteration: 1370, Train loss: -0.9352, rewards: 0.5357\n",
      "Iteration: 1380, Train loss: -1.0007, rewards: 0.4905\n",
      "Iteration: 1390, Train loss: -0.9063, rewards: 0.4775\n",
      "Iteration: 1400, Train loss: -0.9478, rewards: 0.4000\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5585, Hits@10: 0.5691, MRR: 0.5545\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.9644, rewards: 0.4950\n",
      "Iteration: 1420, Train loss: -0.9935, rewards: 0.5037\n",
      "Iteration: 1430, Train loss: -0.9457, rewards: 0.5002\n",
      "Iteration: 1440, Train loss: -0.9488, rewards: 0.5097\n",
      "Iteration: 1450, Train loss: -0.9320, rewards: 0.5350\n",
      "Iteration: 1460, Train loss: -0.9640, rewards: 0.4440\n",
      "Iteration: 1470, Train loss: -0.9262, rewards: 0.4882\n",
      "Iteration: 1480, Train loss: -0.9901, rewards: 0.4807\n",
      "Iteration: 1490, Train loss: -0.8596, rewards: 0.5060\n",
      "Iteration: 1500, Train loss: -1.0094, rewards: 0.4270\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5532, Hits@10: 0.5585, MRR: 0.5510\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.9040, rewards: 0.5172\n",
      "Iteration: 1520, Train loss: -0.9522, rewards: 0.5047\n",
      "Iteration: 1530, Train loss: -0.9741, rewards: 0.4573\n",
      "Iteration: 1540, Train loss: -0.8872, rewards: 0.5158\n",
      "Iteration: 1550, Train loss: -0.9878, rewards: 0.4760\n",
      "Iteration: 1560, Train loss: -0.9819, rewards: 0.4715\n",
      "Iteration: 1570, Train loss: -0.9334, rewards: 0.5203\n",
      "Iteration: 1580, Train loss: -0.9236, rewards: 0.4092\n",
      "Iteration: 1590, Train loss: -0.9645, rewards: 0.4765\n",
      "Iteration: 1600, Train loss: -0.8606, rewards: 0.5453\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5638, Hits@10: 0.5798, MRR: 0.5556\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.9306, rewards: 0.4635\n",
      "Iteration: 1620, Train loss: -0.9540, rewards: 0.5048\n",
      "Iteration: 1630, Train loss: -0.9122, rewards: 0.4652\n",
      "Iteration: 1640, Train loss: -0.9027, rewards: 0.4632\n",
      "Iteration: 1650, Train loss: -1.0765, rewards: 0.4923\n",
      "Iteration: 1660, Train loss: -0.9561, rewards: 0.5268\n",
      "Iteration: 1670, Train loss: -0.9290, rewards: 0.4857\n",
      "Iteration: 1680, Train loss: -0.9901, rewards: 0.5028\n",
      "Iteration: 1690, Train loss: -0.8757, rewards: 0.4730\n",
      "Iteration: 1700, Train loss: -0.9083, rewards: 0.4887\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5532, Hits@10: 0.5691, MRR: 0.5525\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -1.0291, rewards: 0.4953\n",
      "Iteration: 1720, Train loss: -1.0086, rewards: 0.5002\n",
      "Iteration: 1730, Train loss: -0.9267, rewards: 0.4875\n",
      "Iteration: 1740, Train loss: -0.8419, rewards: 0.4535\n",
      "Iteration: 1750, Train loss: -1.0509, rewards: 0.5065\n",
      "Iteration: 1760, Train loss: -1.0335, rewards: 0.4888\n",
      "Iteration: 1770, Train loss: -1.0313, rewards: 0.4948\n",
      "Iteration: 1780, Train loss: -0.9368, rewards: 0.4732\n",
      "Iteration: 1790, Train loss: -0.9590, rewards: 0.4917\n",
      "Iteration: 1800, Train loss: -1.0487, rewards: 0.4928\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5532, Hits@10: 0.5638, MRR: 0.5519\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.9814, rewards: 0.4518\n",
      "Iteration: 1820, Train loss: -0.8644, rewards: 0.4495\n",
      "Iteration: 1830, Train loss: -0.9848, rewards: 0.4665\n",
      "Iteration: 1840, Train loss: -0.9780, rewards: 0.4683\n",
      "Iteration: 1850, Train loss: -0.9444, rewards: 0.4910\n",
      "Iteration: 1860, Train loss: -0.9887, rewards: 0.4918\n",
      "Iteration: 1870, Train loss: -1.0386, rewards: 0.5143\n",
      "Iteration: 1880, Train loss: -0.8982, rewards: 0.4665\n",
      "Iteration: 1890, Train loss: -0.9398, rewards: 0.5345\n",
      "Iteration: 1900, Train loss: -1.0180, rewards: 0.4380\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5638, Hits@10: 0.5851, MRR: 0.5572\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -0.8528, rewards: 0.4435\n",
      "Iteration: 1920, Train loss: -0.8906, rewards: 0.4262\n",
      "Iteration: 1930, Train loss: -0.9645, rewards: 0.4713\n",
      "Iteration: 1940, Train loss: -1.0608, rewards: 0.4710\n",
      "Iteration: 1950, Train loss: -0.8647, rewards: 0.5043\n",
      "Iteration: 1960, Train loss: -0.8093, rewards: 0.5538\n",
      "Iteration: 1970, Train loss: -0.9085, rewards: 0.4620\n",
      "Iteration: 1980, Train loss: -0.9862, rewards: 0.5170\n",
      "Iteration: 1990, Train loss: -0.8789, rewards: 0.4895\n",
      "Iteration: 2000, Train loss: -1.0040, rewards: 0.4652\n",
      "Eval:\n",
      "Hits@1: 0.5479, Hits@3: 0.5585, Hits@10: 0.5691, MRR: 0.5550\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personborninlocation//test_beam/ ]\n",
      "Hits@1: 0.5337, Hits@3: 0.5959, Hits@10: 0.6995, MRR: 0.5789\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.7803506942107977 (193 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-29 00:27:06,601]\u001b[0m Trial 3 finished with value: 0.7803506942107977 and parameters: {'lr': 0.003119060715398256, 'bs': 30, 'b': 0.4489498520770626, 'l': 0.35194565509672604, 'ee': 100}. Best is trial 3 with value: 0.7803506942107977.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.0767, rewards: 0.4664\n",
      "Iteration: 10, Train loss: -0.0074, rewards: 0.5545\n",
      "Iteration: 15, Train loss: -0.0043, rewards: 0.4882\n",
      "Iteration: 20, Train loss: -0.0000, rewards: 0.5727\n",
      "Iteration: 25, Train loss: -0.0000, rewards: 0.5273\n",
      "Iteration: 30, Train loss: -0.0000, rewards: 0.5818\n",
      "Iteration: 35, Train loss: -0.0000, rewards: 0.4909\n",
      "Iteration: 40, Train loss: -0.0025, rewards: 0.5455\n",
      "Iteration: 45, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 50, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.2287, Hits@3: 0.2340, Hits@10: 0.2553, MRR: 0.2359\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.0001, rewards: 0.2909\n",
      "Iteration: 60, Train loss: -0.0000, rewards: 0.3273\n",
      "Iteration: 65, Train loss: -0.0000, rewards: 0.1727\n",
      "Iteration: 70, Train loss: -0.0000, rewards: 0.0909\n",
      "Iteration: 75, Train loss: -0.0005, rewards: 0.0818\n",
      "Iteration: 80, Train loss: -0.0000, rewards: 0.3455\n",
      "Iteration: 85, Train loss: -0.0013, rewards: 0.3455\n",
      "Iteration: 90, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 95, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 100, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0016\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.0000, rewards: 0.0091\n",
      "Iteration: 110, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 115, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 120, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 125, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 130, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 135, Train loss: -0.0000, rewards: 0.0091\n",
      "Iteration: 140, Train loss: -0.0000, rewards: 0.0818\n",
      "Iteration: 145, Train loss: -0.0000, rewards: 0.3273\n",
      "Iteration: 150, Train loss: -0.0015, rewards: 0.3000\n",
      "Eval:\n",
      "Hits@1: 0.2447, Hits@3: 0.2660, Hits@10: 0.3723, MRR: 0.2795\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.0002, rewards: 0.2455\n",
      "Iteration: 160, Train loss: -0.0004, rewards: 0.5182\n",
      "Iteration: 165, Train loss: -0.0032, rewards: 0.4545\n",
      "Iteration: 170, Train loss: -0.0281, rewards: 0.6000\n",
      "Iteration: 175, Train loss: -0.0089, rewards: 0.3000\n",
      "Iteration: 180, Train loss: -0.0118, rewards: 0.4727\n",
      "Iteration: 185, Train loss: -0.0060, rewards: 0.5000\n",
      "Iteration: 190, Train loss: -0.0071, rewards: 0.5273\n",
      "Iteration: 195, Train loss: -0.0095, rewards: 0.4455\n",
      "Iteration: 200, Train loss: -0.0143, rewards: 0.5727\n",
      "Eval:\n",
      "Hits@1: 0.5160, Hits@3: 0.5213, Hits@10: 0.5372, MRR: 0.5209\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.0029, rewards: 0.5545\n",
      "Iteration: 210, Train loss: -0.0097, rewards: 0.6091\n",
      "Iteration: 215, Train loss: -0.0035, rewards: 0.4909\n",
      "Iteration: 220, Train loss: -0.0032, rewards: 0.4909\n",
      "Iteration: 225, Train loss: -0.0072, rewards: 0.3000\n",
      "Iteration: 230, Train loss: -0.0015, rewards: 0.3818\n",
      "Iteration: 235, Train loss: -0.0004, rewards: 0.2091\n",
      "Iteration: 240, Train loss: -0.0026, rewards: 0.0182\n",
      "Iteration: 245, Train loss: -0.0016, rewards: 0.0182\n",
      "Iteration: 250, Train loss: -0.0027, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0053, Hits@3: 0.2021, Hits@10: 0.2979, MRR: 0.0960\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.0048, rewards: 0.0000\n",
      "Iteration: 260, Train loss: -0.0116, rewards: 0.2000\n",
      "Iteration: 265, Train loss: -0.0114, rewards: 0.2455\n",
      "Iteration: 270, Train loss: -0.0014, rewards: 0.0000\n",
      "Iteration: 275, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 280, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 285, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 290, Train loss: -0.0017, rewards: 0.0091\n",
      "Iteration: 295, Train loss: -0.0017, rewards: 0.0000\n",
      "Iteration: 300, Train loss: -0.0004, rewards: 0.0091\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.1862, Hits@10: 0.2128, MRR: 0.1191\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.0020, rewards: 0.0000\n",
      "Iteration: 310, Train loss: -0.0015, rewards: 0.0000\n",
      "Iteration: 315, Train loss: -0.0044, rewards: 0.0182\n",
      "Iteration: 320, Train loss: -0.0008, rewards: 0.0000\n",
      "Iteration: 325, Train loss: -0.0016, rewards: 0.0000\n",
      "Iteration: 330, Train loss: -0.0008, rewards: 0.0000\n",
      "Iteration: 335, Train loss: -0.0020, rewards: 0.0000\n",
      "Iteration: 340, Train loss: -0.0012, rewards: 0.0000\n",
      "Iteration: 345, Train loss: -0.0024, rewards: 0.0000\n",
      "Iteration: 350, Train loss: -0.0007, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0160, Hits@10: 0.0160, MRR: 0.0435\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -0.0020, rewards: 0.0000\n",
      "Iteration: 360, Train loss: -0.0015, rewards: 0.0000\n",
      "Iteration: 365, Train loss: -0.0017, rewards: 0.0000\n"
     ]
    }
   ],
   "source": [
    "# Tune hyper-parameters for the first sub-task; the study maximizes the value returned by `objective`.\n",
    "sub_task = sub_tasks_list[0]\n",
    "\n",
    "# Trials are persisted in a per-task SQLite file. load_if_exists=True lets a re-run of this\n",
    "# cell (or a restarted kernel) resume the stored study instead of raising\n",
    "# optuna.exceptions.DuplicatedStudyError because the study name already exists in the DB.\n",
    "study = optuna.create_study(\n",
    "    storage=f\"sqlite:///{sub_task}.db\",\n",
    "    study_name=f\"{sub_task}\",\n",
    "    direction='maximize',\n",
    "    load_if_exists=True,\n",
    ")\n",
    "\n",
    "# NOTE(review): n_trials is the number of trials run by this call, so resuming an existing\n",
    "# study adds up to 1000 further trials on top of those already stored.\n",
    "study.optimize(objective, n_trials=1000)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
