{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "b2479ab1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-0bf58d0a-b3c9-59ef-811b-2885c7169709\"\n",
    "\n",
    "from model.ours3 import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "a39d5a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(task = None):\n",
    "    options = {}\n",
    "\n",
    "    #basic setting\n",
    "    task_name = 'nell-995' if task is None else task\n",
    "    \n",
    "    options['use_cuda'] = True\n",
    "    options['vocab_dir'] = '../MINERVA/datasets/data_preprocessed/nell/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "    options['relation_vocab'] = json.load(open(options['vocab_dir'] + '/relation_vocab.json'))\n",
    "    options['entity_vocab'] = json.load(open(options['vocab_dir'] + '/entity_vocab.json'))\n",
    "    \n",
    "    \n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_nell995-1/'\n",
    "        options['output_dir'] = './outputs_nell995-1/'\n",
    "    else:\n",
    "        options['pretrain_model_dir'] = f'./outputs_nell995-1/'\n",
    "        options['model_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        if not os.path.exists(options['output_dir']):\n",
    "            os.makedirs(options['output_dir'])\n",
    "        if not os.path.exists(options['model_dir']):\n",
    "            os.makedirs(options['model_dir'])\n",
    "\n",
    "    #agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = 1\n",
    "    options['max_num_actions'] = 40\n",
    "    options['gnn_layer'] = 2\n",
    "\n",
    "    #hyperparameters\n",
    "    options['test_rollouts'] = 40\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = 64\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = 0.15\n",
    "    options['Lambda'] = 0.15\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = 0.00005\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 5\n",
    "    options['total_iterations'] = 20*(64/options['batch_size'])\n",
    "    options['pool'] = 'max'\n",
    "    \n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "12f1b8ba",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n"
     ]
    }
   ],
   "source": [
    "params = set_params()\n",
    "params['test_rollouts'] = 100\n",
    "params['max_num_actions'] = 100\n",
    "params['eval_batch_size'] = 8\n",
    "\n",
    "trainer = Trainer(params)\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "# path_logger_file = trainer.path_logger_file\n",
    "output_dir = trainer.output_dir\n",
    "path_logger_file = output_dir\n",
    "\n",
    "if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "    os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "    \n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "17bc5425",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8207787473535506 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6278593427818233 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.572523027000639 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8249362244897959 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9319237147595357 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.9153204137843777 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.8065181795751745 (193 queries evaluated)\n",
      "WorksFor.txt\n",
      "MINERVA MAP: 0.8287528177373783 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.9408317251690747 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8386739927983896 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "sub_tasks_list = ['AthletePlaysInLeague',\n",
    "'AthletePlaysForTeam ',\n",
    "'AthleteHomeStadium ',\n",
    "'TeamPlaysSport',\n",
    "'AthletePlaysSport',\n",
    "'OrganizationHiredPerson',\n",
    "'PersonBornInLocation',\n",
    "'WorksFor',\n",
    "'organizationheadquarteredincity',\n",
    "'PersonLeadsOrganization']\n",
    "    \n",
    "map_list = {}    \n",
    "for sub_task in sub_tasks_list:\n",
    "    trainer.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "    \n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    map_list[sub_task] = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", \n",
    "              trainer.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "10a372ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "import optuna\n",
    "from model.ours3 import *\n",
    "global sub_tasks_list\n",
    "\n",
    "sub_tasks_list = [\n",
    "# 'AthletePlaysInLeague',\n",
    "# 'AthletePlaysForTeam ',\n",
    "'AthleteHomeStadium'\n",
    "# 'TeamPlaysSport',\n",
    "# 'AthletePlaysSport',\n",
    "# 'OrganizationHiredPerson',\n",
    "# 'PersonBornInLocation',\n",
    "# 'WorksFor',\n",
    "# 'organizationheadquarteredincity',\n",
    "#'PersonLeadsOrganization'\n",
    "]\n",
    "\n",
    "def objective(trial):\n",
    "    \n",
    "    sub_task = sub_tasks_list[0]\n",
    "\n",
    "    lr = trial.suggest_float('lr', 1e-6, 1e-2)\n",
    "    bs = trial.suggest_int('bs', 4, 128)\n",
    "    b = trial.suggest_float('b', 0, 0.5)\n",
    "    l = trial.suggest_float('l', 0, 0.5)\n",
    "    ee = trial.suggest_categorical('ee', [10,20,50,100])\n",
    "\n",
    "    params = set_params(sub_task.lower().strip())\n",
    "    params['learning_rate'] = lr\n",
    "    params['eval_every'] = ee\n",
    "    params['batch_size'] = bs\n",
    "    params['beta'] = b\n",
    "    params['Lambda'] = l\n",
    "    params['total_iterations'] = min(50*params['eval_every'], 2000)\n",
    "\n",
    "    sub_trainer = Trainer(params)\n",
    "    sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "\n",
    "    sub_trainer.agent.train()\n",
    "    sub_trainer.train()\n",
    "    #     torch.save(sub_trainer.agent.state_dict(), params['model_dir'] + 'tmp.ckpt')\n",
    "\n",
    "    params['test_rollouts'] = 100\n",
    "    params['max_num_actions'] = 100\n",
    "    params['eval_batch_size'] = 8\n",
    "\n",
    "    sub_tester = Trainer(params)\n",
    "    sub_tester.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "    sub_tester.agent.eval()\n",
    "\n",
    "    save_path = sub_tester.save_path\n",
    "    output_dir = sub_tester.output_dir\n",
    "    path_logger_file = output_dir\n",
    "\n",
    "    if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "        os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "    sub_tester.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "    with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "        score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "    sub_tester.test_environment = sub_tester.test_test_environment\n",
    "    test_results = sub_tester.test(beam=True, print_paths=True, save_model=True)  \n",
    "\n",
    "    sub_tester.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    MAP = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", \n",
    "              sub_tester.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')\n",
    "\n",
    "    del sub_tester, sub_trainer\n",
    "    torch.cuda.empty_cache()\n",
    "    gc.collect()\n",
    "    \n",
    "    return MAP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f2971eba",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:11:07,130]\u001b[0m A new study created in RDB with name: AthleteHomeStadium\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.0955, rewards: 0.0229\n",
      "Iteration: 20, Train loss: -0.2768, rewards: 0.1571\n",
      "Iteration: 30, Train loss: -0.1327, rewards: 0.6671\n",
      "Iteration: 40, Train loss: -0.0130, rewards: 0.2000\n",
      "Iteration: 50, Train loss: -0.0090, rewards: 0.0000\n",
      "Iteration: 60, Train loss: -0.0094, rewards: 0.0000\n",
      "Iteration: 70, Train loss: -0.0011, rewards: 0.0000\n",
      "Iteration: 80, Train loss: -0.0010, rewards: 0.0000\n",
      "Iteration: 90, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 100, Train loss: -0.0013, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0249, MRR: 0.0044\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.0055, rewards: 0.0000\n",
      "Iteration: 120, Train loss: -0.0011, rewards: 0.0000\n",
      "Iteration: 130, Train loss: 0.0082, rewards: 0.0286\n",
      "Iteration: 140, Train loss: -0.0204, rewards: 0.5171\n",
      "Iteration: 150, Train loss: -0.0273, rewards: 0.3357\n",
      "Iteration: 160, Train loss: -0.0011, rewards: 0.0000\n",
      "Iteration: 170, Train loss: -0.0007, rewards: 0.0143\n",
      "Iteration: 180, Train loss: -0.0000, rewards: 0.0857\n",
      "Iteration: 190, Train loss: -0.0001, rewards: 0.1857\n",
      "Iteration: 200, Train loss: -0.0000, rewards: 0.3143\n",
      "Eval:\n",
      "Hits@1: 0.3035, Hits@3: 0.6020, Hits@10: 0.6318, MRR: 0.4612\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.0071, rewards: 0.3286\n",
      "Iteration: 220, Train loss: -0.0050, rewards: 0.6857\n",
      "Iteration: 230, Train loss: -0.0019, rewards: 0.5286\n",
      "Iteration: 240, Train loss: -0.0032, rewards: 0.5000\n",
      "Iteration: 250, Train loss: -0.0007, rewards: 0.4286\n",
      "Iteration: 260, Train loss: -0.0083, rewards: 0.4143\n",
      "Iteration: 270, Train loss: 0.0082, rewards: 0.3429\n",
      "Iteration: 280, Train loss: 0.0130, rewards: 0.4000\n",
      "Iteration: 290, Train loss: 0.0343, rewards: 0.3714\n",
      "Iteration: 300, Train loss: 0.0009, rewards: 0.3429\n",
      "Eval:\n",
      "Hits@1: 0.3781, Hits@3: 0.7015, Hits@10: 0.7164, MRR: 0.5362\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: 0.0023, rewards: 0.3000\n",
      "Iteration: 320, Train loss: 0.0188, rewards: 0.3286\n",
      "Iteration: 330, Train loss: 0.0072, rewards: 0.5000\n",
      "Iteration: 340, Train loss: 0.0048, rewards: 0.5143\n",
      "Iteration: 350, Train loss: 0.0201, rewards: 0.3857\n",
      "Iteration: 360, Train loss: 0.0060, rewards: 0.4143\n",
      "Iteration: 370, Train loss: 0.0199, rewards: 0.3857\n",
      "Iteration: 380, Train loss: 0.0046, rewards: 0.4143\n",
      "Iteration: 390, Train loss: 0.0150, rewards: 0.4571\n",
      "Iteration: 400, Train loss: 0.0220, rewards: 0.4429\n",
      "Eval:\n",
      "Hits@1: 0.3930, Hits@3: 0.7065, Hits@10: 0.7164, MRR: 0.5439\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: 0.0129, rewards: 0.4286\n",
      "Iteration: 420, Train loss: 0.0123, rewards: 0.4714\n",
      "Iteration: 430, Train loss: 0.0203, rewards: 0.4143\n",
      "Iteration: 440, Train loss: 0.0252, rewards: 0.4571\n",
      "Iteration: 450, Train loss: 0.0266, rewards: 0.4857\n",
      "Iteration: 460, Train loss: 0.0122, rewards: 0.3143\n",
      "Iteration: 470, Train loss: 0.0150, rewards: 0.5143\n",
      "Iteration: 480, Train loss: 0.0041, rewards: 0.4286\n",
      "Iteration: 490, Train loss: 0.0063, rewards: 0.4286\n",
      "Iteration: 500, Train loss: 0.0054, rewards: 0.4000\n",
      "Eval:\n",
      "Hits@1: 0.3980, Hits@3: 0.7065, Hits@10: 0.7164, MRR: 0.5481\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: 0.0035, rewards: 0.3571\n",
      "Iteration: 520, Train loss: 0.0114, rewards: 0.3857\n",
      "Iteration: 530, Train loss: 0.0107, rewards: 0.4714\n",
      "Iteration: 540, Train loss: 0.0166, rewards: 0.4286\n",
      "Iteration: 550, Train loss: 0.0026, rewards: 0.3857\n",
      "Iteration: 560, Train loss: 0.0034, rewards: 0.3571\n",
      "Iteration: 570, Train loss: 0.0103, rewards: 0.4143\n",
      "Iteration: 580, Train loss: 0.0086, rewards: 0.2714\n",
      "Iteration: 590, Train loss: 0.0041, rewards: 0.4143\n",
      "Iteration: 600, Train loss: -0.0292, rewards: 0.5714\n",
      "Eval:\n",
      "Hits@1: 0.5075, Hits@3: 0.6468, Hits@10: 0.7164, MRR: 0.5905\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.0148, rewards: 0.5714\n",
      "Iteration: 620, Train loss: -0.0309, rewards: 0.5143\n",
      "Iteration: 630, Train loss: -0.0458, rewards: 0.5143\n",
      "Iteration: 640, Train loss: 0.0079, rewards: 0.5857\n",
      "Iteration: 650, Train loss: -0.0524, rewards: 0.5271\n",
      "Iteration: 660, Train loss: 0.0063, rewards: 0.5143\n",
      "Iteration: 670, Train loss: 0.0093, rewards: 0.3714\n",
      "Iteration: 680, Train loss: -0.0015, rewards: 0.6000\n",
      "Iteration: 690, Train loss: 0.0216, rewards: 0.4571\n",
      "Iteration: 700, Train loss: 0.0146, rewards: 0.4864\n",
      "Eval:\n",
      "Hits@1: 0.5522, Hits@3: 0.5970, Hits@10: 0.7065, MRR: 0.5935\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.0013, rewards: 0.5571\n",
      "Iteration: 720, Train loss: -0.0089, rewards: 0.5143\n",
      "Iteration: 730, Train loss: 0.0170, rewards: 0.5429\n",
      "Iteration: 740, Train loss: 0.0021, rewards: 0.5857\n",
      "Iteration: 750, Train loss: 0.0095, rewards: 0.6000\n",
      "Iteration: 760, Train loss: -0.0023, rewards: 0.5714\n",
      "Iteration: 770, Train loss: 0.0092, rewards: 0.4000\n",
      "Iteration: 780, Train loss: -0.0013, rewards: 0.4571\n",
      "Iteration: 790, Train loss: 0.0140, rewards: 0.4429\n",
      "Iteration: 800, Train loss: 0.0077, rewards: 0.4857\n",
      "Eval:\n",
      "Hits@1: 0.4826, Hits@3: 0.5522, Hits@10: 0.6617, MRR: 0.5341\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: 0.0018, rewards: 0.5286\n",
      "Iteration: 820, Train loss: 0.0010, rewards: 0.4714\n",
      "Iteration: 830, Train loss: -0.0081, rewards: 0.5000\n",
      "Iteration: 840, Train loss: -0.0078, rewards: 0.4286\n",
      "Iteration: 850, Train loss: 0.0133, rewards: 0.4000\n",
      "Iteration: 860, Train loss: 0.0083, rewards: 0.4857\n",
      "Iteration: 870, Train loss: 0.0048, rewards: 0.4714\n",
      "Iteration: 880, Train loss: -0.0049, rewards: 0.3857\n",
      "Iteration: 890, Train loss: 0.0013, rewards: 0.4714\n",
      "Iteration: 900, Train loss: 0.0065, rewards: 0.5286\n",
      "Eval:\n",
      "Hits@1: 0.4129, Hits@3: 0.5522, Hits@10: 0.6418, MRR: 0.4848\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.0061, rewards: 0.4000\n",
      "Iteration: 920, Train loss: -0.0002, rewards: 0.3857\n",
      "Iteration: 930, Train loss: 0.0092, rewards: 0.4000\n",
      "Iteration: 940, Train loss: -0.0074, rewards: 0.4143\n",
      "Iteration: 950, Train loss: 0.0104, rewards: 0.5000\n",
      "Iteration: 960, Train loss: 0.0042, rewards: 0.4143\n",
      "Iteration: 970, Train loss: 0.0060, rewards: 0.5000\n",
      "Iteration: 980, Train loss: -0.0056, rewards: 0.3857\n",
      "Iteration: 990, Train loss: -0.0017, rewards: 0.4000\n",
      "Iteration: 1000, Train loss: -0.0052, rewards: 0.4857\n",
      "Eval:\n",
      "Hits@1: 0.3930, Hits@3: 0.5075, Hits@10: 0.6169, MRR: 0.4693\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: 0.0144, rewards: 0.3714\n",
      "Iteration: 1020, Train loss: 0.0076, rewards: 0.4429\n",
      "Iteration: 1030, Train loss: 0.0163, rewards: 0.4286\n",
      "Iteration: 1040, Train loss: -0.0055, rewards: 0.3143\n",
      "Iteration: 1050, Train loss: 0.0093, rewards: 0.3714\n",
      "Iteration: 1060, Train loss: -0.0089, rewards: 0.3571\n",
      "Iteration: 1070, Train loss: -0.0020, rewards: 0.3000\n",
      "Iteration: 1080, Train loss: -0.0004, rewards: 0.3857\n",
      "Iteration: 1090, Train loss: 0.0127, rewards: 0.3857\n",
      "Iteration: 1100, Train loss: -0.0035, rewards: 0.3143\n",
      "Eval:\n",
      "Hits@1: 0.1493, Hits@3: 0.5821, Hits@10: 0.6667, MRR: 0.3640\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.0096, rewards: 0.2571\n",
      "Iteration: 1120, Train loss: -0.0014, rewards: 0.2857\n",
      "Iteration: 1130, Train loss: 0.0055, rewards: 0.2857\n",
      "Iteration: 1140, Train loss: -0.0011, rewards: 0.3143\n",
      "Iteration: 1150, Train loss: 0.0129, rewards: 0.0571\n",
      "Iteration: 1160, Train loss: 0.0037, rewards: 0.1857\n",
      "Iteration: 1170, Train loss: -0.0001, rewards: 0.1000\n",
      "Iteration: 1180, Train loss: 0.0051, rewards: 0.1286\n",
      "Iteration: 1190, Train loss: -0.0000, rewards: 0.0714\n",
      "Iteration: 1200, Train loss: 0.0080, rewards: 0.0857\n",
      "Eval:\n",
      "Hits@1: 0.0647, Hits@3: 0.3184, Hits@10: 0.5473, MRR: 0.2367\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.0004, rewards: 0.1000\n",
      "Iteration: 1220, Train loss: 0.0107, rewards: 0.0571\n",
      "Iteration: 1230, Train loss: -0.0007, rewards: 0.1000\n",
      "Iteration: 1240, Train loss: -0.0000, rewards: 0.2000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1250, Train loss: -0.0015, rewards: 0.0714\n",
      "Iteration: 1260, Train loss: 0.0184, rewards: 0.1857\n",
      "Iteration: 1270, Train loss: 0.0034, rewards: 0.1000\n",
      "Iteration: 1280, Train loss: 0.0024, rewards: 0.1000\n",
      "Iteration: 1290, Train loss: -0.0000, rewards: 0.1429\n",
      "Iteration: 1300, Train loss: -0.0003, rewards: 0.0571\n",
      "Eval:\n",
      "Hits@1: 0.0597, Hits@3: 0.4229, Hits@10: 0.6269, MRR: 0.2639\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.0001, rewards: 0.0429\n",
      "Iteration: 1320, Train loss: -0.0001, rewards: 0.0571\n",
      "Iteration: 1330, Train loss: 0.0077, rewards: 0.0429\n",
      "Iteration: 1340, Train loss: -0.0001, rewards: 0.0571\n",
      "Iteration: 1350, Train loss: -0.0031, rewards: 0.0286\n",
      "Iteration: 1360, Train loss: -0.0003, rewards: 0.0286\n",
      "Iteration: 1370, Train loss: 0.0185, rewards: 0.0714\n",
      "Iteration: 1380, Train loss: -0.0016, rewards: 0.0429\n",
      "Iteration: 1390, Train loss: -0.0001, rewards: 0.0286\n",
      "Iteration: 1400, Train loss: -0.0001, rewards: 0.0429\n",
      "Eval:\n",
      "Hits@1: 0.0597, Hits@3: 0.4428, Hits@10: 0.6368, MRR: 0.2687\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.0001, rewards: 0.0286\n",
      "Iteration: 1420, Train loss: 0.0047, rewards: 0.0286\n",
      "Iteration: 1430, Train loss: 0.0068, rewards: 0.0429\n",
      "Iteration: 1440, Train loss: -0.0003, rewards: 0.0286\n",
      "Iteration: 1450, Train loss: -0.0000, rewards: 0.0286\n",
      "Iteration: 1460, Train loss: 0.0083, rewards: 0.0857\n",
      "Iteration: 1470, Train loss: 0.0086, rewards: 0.0714\n",
      "Iteration: 1480, Train loss: 0.0066, rewards: 0.0714\n",
      "Iteration: 1490, Train loss: 0.0036, rewards: 0.0571\n",
      "Iteration: 1500, Train loss: -0.0016, rewards: 0.0714\n",
      "Eval:\n",
      "Hits@1: 0.0547, Hits@3: 0.4378, Hits@10: 0.6368, MRR: 0.2658\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: 0.0117, rewards: 0.1000\n",
      "Iteration: 1520, Train loss: 0.0117, rewards: 0.1000\n",
      "Iteration: 1530, Train loss: -0.0001, rewards: 0.0429\n",
      "Iteration: 1540, Train loss: 0.0077, rewards: 0.0429\n",
      "Iteration: 1550, Train loss: -0.0003, rewards: 0.0429\n",
      "Iteration: 1560, Train loss: -0.0004, rewards: 0.0143\n",
      "Iteration: 1570, Train loss: -0.0000, rewards: 0.0714\n",
      "Iteration: 1580, Train loss: 0.0074, rewards: 0.0571\n",
      "Iteration: 1590, Train loss: -0.0000, rewards: 0.0429\n",
      "Iteration: 1600, Train loss: 0.0072, rewards: 0.0286\n",
      "Eval:\n",
      "Hits@1: 0.0448, Hits@3: 0.4279, Hits@10: 0.6368, MRR: 0.2594\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: 0.0077, rewards: 0.0857\n",
      "Iteration: 1620, Train loss: -0.0017, rewards: 0.0429\n",
      "Iteration: 1630, Train loss: 0.0187, rewards: 0.0429\n",
      "Iteration: 1640, Train loss: -0.0000, rewards: 0.0286\n",
      "Iteration: 1650, Train loss: 0.0110, rewards: 0.0714\n",
      "Iteration: 1660, Train loss: 0.0036, rewards: 0.0857\n",
      "Iteration: 1670, Train loss: 0.0138, rewards: 0.0571\n",
      "Iteration: 1680, Train loss: 0.0056, rewards: 0.0143\n",
      "Iteration: 1690, Train loss: -0.0007, rewards: 0.0571\n",
      "Iteration: 1700, Train loss: 0.0090, rewards: 0.0857\n",
      "Eval:\n",
      "Hits@1: 0.0498, Hits@3: 0.4279, Hits@10: 0.6070, MRR: 0.2585\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: 0.0077, rewards: 0.0429\n",
      "Iteration: 1720, Train loss: 0.0079, rewards: 0.0714\n",
      "Iteration: 1730, Train loss: 0.0230, rewards: 0.0571\n",
      "Iteration: 1740, Train loss: -0.0003, rewards: 0.0429\n",
      "Iteration: 1750, Train loss: -0.0004, rewards: 0.0286\n",
      "Iteration: 1760, Train loss: -0.0015, rewards: 0.0429\n",
      "Iteration: 1770, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 1780, Train loss: 0.0109, rewards: 0.1286\n",
      "Iteration: 1790, Train loss: 0.0063, rewards: 0.0286\n",
      "Iteration: 1800, Train loss: -0.0001, rewards: 0.0714\n",
      "Eval:\n",
      "Hits@1: 0.0498, Hits@3: 0.4229, Hits@10: 0.6070, MRR: 0.2537\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.0003, rewards: 0.0429\n",
      "Iteration: 1820, Train loss: -0.0001, rewards: 0.0286\n",
      "Iteration: 1830, Train loss: 0.0141, rewards: 0.0714\n",
      "Iteration: 1840, Train loss: 0.0159, rewards: 0.0429\n",
      "Iteration: 1850, Train loss: 0.0122, rewards: 0.0714\n",
      "Iteration: 1860, Train loss: -0.0001, rewards: 0.0429\n",
      "Iteration: 1870, Train loss: -0.0000, rewards: 0.0143\n",
      "Iteration: 1880, Train loss: -0.0000, rewards: 0.0286\n",
      "Iteration: 1890, Train loss: -0.0017, rewards: 0.0429\n",
      "Iteration: 1900, Train loss: 0.0110, rewards: 0.0429\n",
      "Eval:\n",
      "Hits@1: 0.0498, Hits@3: 0.4229, Hits@10: 0.6070, MRR: 0.2537\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: 0.0054, rewards: 0.0286\n",
      "Iteration: 1920, Train loss: -0.0001, rewards: 0.1000\n",
      "Iteration: 1930, Train loss: -0.0001, rewards: 0.0714\n",
      "Iteration: 1940, Train loss: -0.0002, rewards: 0.0571\n",
      "Iteration: 1950, Train loss: 0.0159, rewards: 0.0429\n",
      "Iteration: 1960, Train loss: 0.0120, rewards: 0.0571\n",
      "Iteration: 1970, Train loss: -0.0000, rewards: 0.0429\n",
      "Iteration: 1980, Train loss: 0.0143, rewards: 0.0714\n",
      "Iteration: 1990, Train loss: -0.0001, rewards: 0.0429\n",
      "Iteration: 2000, Train loss: 0.0079, rewards: 0.0143\n",
      "Eval:\n",
      "Hits@1: 0.0498, Hits@3: 0.4229, Hits@10: 0.6070, MRR: 0.2560\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/athletehomestadium//test_beam/ ]\n",
      "Hits@1: 0.6070, Hits@3: 0.7214, Hits@10: 0.7910, MRR: 0.6730\n",
      "AthleteHomeStadium\n",
      "MINERVA MAP: 0.8576843416395655 (201 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:35:41,665]\u001b[0m Trial 0 finished with value: 0.8576843416395655 and parameters: {'lr': 0.006879074651296699, 'bs': 7, 'b': 0.040941313826224734, 'l': 0.4138501113958198, 'ee': 100}. Best is trial 0 with value: 0.8576843416395655.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.7547, rewards: 0.3623\n",
      "Iteration: 10, Train loss: -0.4716, rewards: 0.6801\n",
      "Iteration: 15, Train loss: -0.8122, rewards: 0.6068\n",
      "Iteration: 20, Train loss: -0.8496, rewards: 0.6048\n",
      "Iteration: 25, Train loss: -0.8107, rewards: 0.6515\n",
      "Iteration: 30, Train loss: -0.8854, rewards: 0.6623\n",
      "Iteration: 35, Train loss: -0.8532, rewards: 0.6944\n",
      "Iteration: 40, Train loss: -0.9013, rewards: 0.6469\n",
      "Iteration: 45, Train loss: -0.8650, rewards: 0.7139\n",
      "Iteration: 50, Train loss: -0.8571, rewards: 0.6700\n",
      "Eval:\n",
      "Hits@1: 0.7811, Hits@3: 0.7910, Hits@10: 0.8010, MRR: 0.7857\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.8352, rewards: 0.6877\n",
      "Iteration: 60, Train loss: -0.8545, rewards: 0.6735\n",
      "Iteration: 65, Train loss: -0.7518, rewards: 0.7031\n",
      "Iteration: 70, Train loss: -0.8851, rewards: 0.6857\n",
      "Iteration: 75, Train loss: -0.9903, rewards: 0.6736\n",
      "Iteration: 80, Train loss: -0.7288, rewards: 0.7508\n",
      "Iteration: 85, Train loss: -0.6362, rewards: 0.8085\n",
      "Iteration: 90, Train loss: -0.7801, rewards: 0.6958\n",
      "Iteration: 95, Train loss: -0.7920, rewards: 0.7456\n",
      "Iteration: 100, Train loss: -0.9697, rewards: 0.7283\n",
      "Eval:\n",
      "Hits@1: 0.7662, Hits@3: 0.7761, Hits@10: 0.7811, MRR: 0.7724\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.9126, rewards: 0.7450\n",
      "Iteration: 110, Train loss: -0.8745, rewards: 0.7373\n",
      "Iteration: 115, Train loss: -0.9357, rewards: 0.6993\n",
      "Iteration: 120, Train loss: -0.9629, rewards: 0.7523\n",
      "Iteration: 125, Train loss: -1.0418, rewards: 0.7106\n",
      "Iteration: 130, Train loss: -1.0127, rewards: 0.6919\n",
      "Iteration: 135, Train loss: -0.9201, rewards: 0.7242\n",
      "Iteration: 140, Train loss: -0.9669, rewards: 0.7471\n",
      "Iteration: 145, Train loss: -1.0720, rewards: 0.7076\n",
      "Iteration: 150, Train loss: -1.0536, rewards: 0.7263\n",
      "Eval:\n",
      "Hits@1: 0.7413, Hits@3: 0.7811, Hits@10: 0.7811, MRR: 0.7612\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.9637, rewards: 0.7412\n",
      "Iteration: 160, Train loss: -0.9633, rewards: 0.7600\n",
      "Iteration: 165, Train loss: -0.9168, rewards: 0.7169\n",
      "Iteration: 170, Train loss: -1.0074, rewards: 0.7198\n",
      "Iteration: 175, Train loss: -1.0106, rewards: 0.7295\n",
      "Iteration: 180, Train loss: -0.8154, rewards: 0.7608\n",
      "Iteration: 185, Train loss: -0.9286, rewards: 0.7338\n",
      "Iteration: 190, Train loss: -0.9151, rewards: 0.7532\n",
      "Iteration: 195, Train loss: -0.9267, rewards: 0.7938\n",
      "Iteration: 200, Train loss: -1.0022, rewards: 0.7130\n",
      "Eval:\n",
      "Hits@1: 0.7662, Hits@3: 0.7811, Hits@10: 0.7811, MRR: 0.7738\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.9803, rewards: 0.7211\n",
      "Iteration: 210, Train loss: -0.9209, rewards: 0.7508\n",
      "Iteration: 215, Train loss: -0.9873, rewards: 0.7354\n",
      "Iteration: 220, Train loss: -1.0068, rewards: 0.7477\n",
      "Iteration: 225, Train loss: -0.9048, rewards: 0.7646\n",
      "Iteration: 230, Train loss: -0.9581, rewards: 0.7662\n",
      "Iteration: 235, Train loss: -1.0906, rewards: 0.7032\n",
      "Iteration: 240, Train loss: -0.9598, rewards: 0.7825\n",
      "Iteration: 245, Train loss: -1.0036, rewards: 0.7330\n",
      "Iteration: 250, Train loss: -1.0593, rewards: 0.7212\n",
      "Eval:\n",
      "Hits@1: 0.7711, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7778\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.8925, rewards: 0.7500\n",
      "Iteration: 260, Train loss: -0.8928, rewards: 0.7576\n",
      "Iteration: 265, Train loss: -0.9811, rewards: 0.7306\n",
      "Iteration: 270, Train loss: -0.9769, rewards: 0.7036\n",
      "Iteration: 275, Train loss: -0.9776, rewards: 0.7400\n",
      "Iteration: 280, Train loss: -1.0219, rewards: 0.7298\n",
      "Iteration: 285, Train loss: -0.9158, rewards: 0.7588\n",
      "Iteration: 290, Train loss: -1.0252, rewards: 0.7037\n",
      "Iteration: 295, Train loss: -0.9898, rewards: 0.7296\n",
      "Iteration: 300, Train loss: -0.9460, rewards: 0.7558\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7811, Hits@10: 0.7960, MRR: 0.7597\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.9928, rewards: 0.7425\n",
      "Iteration: 310, Train loss: -1.0635, rewards: 0.6890\n",
      "Iteration: 315, Train loss: -0.9455, rewards: 0.7750\n",
      "Iteration: 320, Train loss: -0.9451, rewards: 0.7471\n",
      "Iteration: 325, Train loss: -0.9191, rewards: 0.7581\n",
      "Iteration: 330, Train loss: -0.9066, rewards: 0.7749\n",
      "Iteration: 335, Train loss: -0.9721, rewards: 0.7614\n",
      "Iteration: 340, Train loss: -1.0010, rewards: 0.7277\n",
      "Iteration: 345, Train loss: -0.9090, rewards: 0.7445\n",
      "Iteration: 350, Train loss: -0.9669, rewards: 0.7346\n",
      "Eval:\n",
      "Hits@1: 0.7662, Hits@3: 0.7811, Hits@10: 0.7811, MRR: 0.7736\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -1.0353, rewards: 0.7240\n",
      "Iteration: 360, Train loss: -1.0519, rewards: 0.6994\n",
      "Iteration: 365, Train loss: -1.0199, rewards: 0.7355\n",
      "Iteration: 370, Train loss: -1.0141, rewards: 0.7401\n",
      "Iteration: 375, Train loss: -1.0304, rewards: 0.7135\n",
      "Iteration: 380, Train loss: -1.0589, rewards: 0.7011\n",
      "Iteration: 385, Train loss: -0.9894, rewards: 0.7629\n",
      "Iteration: 390, Train loss: -0.9940, rewards: 0.7570\n",
      "Iteration: 395, Train loss: -0.9620, rewards: 0.7529\n",
      "Iteration: 400, Train loss: -0.9754, rewards: 0.7612\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7662\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -1.0083, rewards: 0.7432\n",
      "Iteration: 410, Train loss: -1.0498, rewards: 0.7208\n",
      "Iteration: 415, Train loss: -0.9535, rewards: 0.7521\n",
      "Iteration: 420, Train loss: -0.9116, rewards: 0.7574\n",
      "Iteration: 425, Train loss: -1.0309, rewards: 0.7343\n",
      "Iteration: 430, Train loss: -1.0059, rewards: 0.7512\n",
      "Iteration: 435, Train loss: -1.0053, rewards: 0.7410\n",
      "Iteration: 440, Train loss: -0.9813, rewards: 0.7286\n",
      "Iteration: 445, Train loss: -0.9827, rewards: 0.7482\n",
      "Iteration: 450, Train loss: -1.0045, rewards: 0.7265\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7587\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -0.9637, rewards: 0.7251\n",
      "Iteration: 460, Train loss: -0.9946, rewards: 0.7361\n",
      "Iteration: 465, Train loss: -1.0219, rewards: 0.7445\n",
      "Iteration: 470, Train loss: -1.0147, rewards: 0.7287\n",
      "Iteration: 475, Train loss: -0.9333, rewards: 0.7804\n",
      "Iteration: 480, Train loss: -0.8983, rewards: 0.7615\n",
      "Iteration: 485, Train loss: -1.0256, rewards: 0.7320\n",
      "Iteration: 490, Train loss: -0.9857, rewards: 0.7526\n",
      "Iteration: 495, Train loss: -1.0118, rewards: 0.7270\n",
      "Iteration: 500, Train loss: -1.0010, rewards: 0.7313\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7666\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -1.0037, rewards: 0.7326\n",
      "Iteration: 510, Train loss: -1.0476, rewards: 0.7195\n",
      "Iteration: 515, Train loss: -1.0425, rewards: 0.7449\n",
      "Iteration: 520, Train loss: -1.0597, rewards: 0.7400\n",
      "Iteration: 525, Train loss: -0.9647, rewards: 0.7474\n",
      "Iteration: 530, Train loss: -0.9445, rewards: 0.7332\n",
      "Iteration: 535, Train loss: -1.0032, rewards: 0.7399\n",
      "Iteration: 540, Train loss: -0.9230, rewards: 0.7485\n",
      "Iteration: 545, Train loss: -0.9992, rewards: 0.7496\n",
      "Iteration: 550, Train loss: -0.9580, rewards: 0.7473\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7663\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -0.9936, rewards: 0.7256\n",
      "Iteration: 560, Train loss: -0.9575, rewards: 0.7479\n",
      "Iteration: 565, Train loss: -0.9993, rewards: 0.7427\n",
      "Iteration: 570, Train loss: -1.0178, rewards: 0.7174\n",
      "Iteration: 575, Train loss: -1.0039, rewards: 0.7231\n",
      "Iteration: 580, Train loss: -0.9479, rewards: 0.7377\n",
      "Iteration: 585, Train loss: -0.8562, rewards: 0.7607\n",
      "Iteration: 590, Train loss: -1.0020, rewards: 0.7224\n",
      "Iteration: 595, Train loss: -1.0492, rewards: 0.7292\n",
      "Iteration: 600, Train loss: -1.0611, rewards: 0.7219\n",
      "Eval:\n",
      "Hits@1: 0.7662, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7753\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -0.9388, rewards: 0.7425\n",
      "Iteration: 610, Train loss: -1.0320, rewards: 0.7544\n",
      "Iteration: 615, Train loss: -0.9403, rewards: 0.7474\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -1.0116, rewards: 0.7210\n",
      "Iteration: 625, Train loss: -1.0217, rewards: 0.7180\n",
      "Iteration: 630, Train loss: -0.9910, rewards: 0.7518\n",
      "Iteration: 635, Train loss: -0.9335, rewards: 0.7605\n",
      "Iteration: 640, Train loss: -1.0244, rewards: 0.7511\n",
      "Iteration: 645, Train loss: -1.0236, rewards: 0.7489\n",
      "Iteration: 650, Train loss: -1.0855, rewards: 0.6865\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7374\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -1.0276, rewards: 0.7193\n",
      "Iteration: 660, Train loss: -1.0675, rewards: 0.7020\n",
      "Iteration: 665, Train loss: -1.0459, rewards: 0.7455\n",
      "Iteration: 670, Train loss: -1.0413, rewards: 0.6870\n",
      "Iteration: 675, Train loss: -0.9469, rewards: 0.7548\n",
      "Iteration: 680, Train loss: -1.0122, rewards: 0.7451\n",
      "Iteration: 685, Train loss: -0.9313, rewards: 0.7325\n",
      "Iteration: 690, Train loss: -0.9437, rewards: 0.7308\n",
      "Iteration: 695, Train loss: -0.9282, rewards: 0.7762\n",
      "Iteration: 700, Train loss: -0.8743, rewards: 0.7725\n",
      "Eval:\n",
      "Hits@1: 0.6318, Hits@3: 0.7711, Hits@10: 0.7711, MRR: 0.7019\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -0.9637, rewards: 0.7244\n",
      "Iteration: 710, Train loss: -0.9588, rewards: 0.7521\n",
      "Iteration: 715, Train loss: -0.9891, rewards: 0.7170\n",
      "Iteration: 720, Train loss: -0.9442, rewards: 0.7586\n",
      "Iteration: 725, Train loss: -0.9910, rewards: 0.7468\n",
      "Iteration: 730, Train loss: -1.0106, rewards: 0.7231\n",
      "Iteration: 735, Train loss: -1.0531, rewards: 0.7292\n",
      "Iteration: 740, Train loss: -1.0448, rewards: 0.7338\n",
      "Iteration: 745, Train loss: -1.0700, rewards: 0.6931\n",
      "Iteration: 750, Train loss: -0.9805, rewards: 0.7440\n",
      "Eval:\n",
      "Hits@1: 0.7363, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7612\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.9994, rewards: 0.7321\n",
      "Iteration: 760, Train loss: -1.0639, rewards: 0.7349\n",
      "Iteration: 765, Train loss: -1.0007, rewards: 0.7438\n",
      "Iteration: 770, Train loss: -1.0420, rewards: 0.7402\n",
      "Iteration: 775, Train loss: -1.0317, rewards: 0.7282\n",
      "Iteration: 780, Train loss: -0.9245, rewards: 0.7461\n",
      "Iteration: 785, Train loss: -0.8993, rewards: 0.7696\n",
      "Iteration: 790, Train loss: -0.9997, rewards: 0.7267\n",
      "Iteration: 795, Train loss: -0.9975, rewards: 0.7351\n",
      "Iteration: 800, Train loss: -1.0183, rewards: 0.7340\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7861, Hits@10: 0.8010, MRR: 0.7621\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -0.9470, rewards: 0.7143\n",
      "Iteration: 810, Train loss: -0.9538, rewards: 0.7440\n",
      "Iteration: 815, Train loss: -1.0537, rewards: 0.7226\n",
      "Iteration: 820, Train loss: -1.0067, rewards: 0.7417\n",
      "Iteration: 825, Train loss: -1.0175, rewards: 0.7332\n",
      "Iteration: 830, Train loss: -1.0564, rewards: 0.7199\n",
      "Iteration: 835, Train loss: -1.0316, rewards: 0.7389\n",
      "Iteration: 840, Train loss: -0.9784, rewards: 0.7518\n",
      "Iteration: 845, Train loss: -1.0817, rewards: 0.7251\n",
      "Iteration: 850, Train loss: -0.9637, rewards: 0.7576\n",
      "Eval:\n",
      "Hits@1: 0.7512, Hits@3: 0.7910, Hits@10: 0.8109, MRR: 0.7749\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -0.9995, rewards: 0.7473\n",
      "Iteration: 860, Train loss: -0.9935, rewards: 0.7318\n",
      "Iteration: 865, Train loss: -0.9470, rewards: 0.7165\n",
      "Iteration: 870, Train loss: -0.9889, rewards: 0.7383\n",
      "Iteration: 875, Train loss: -1.0280, rewards: 0.7207\n",
      "Iteration: 880, Train loss: -0.9000, rewards: 0.7581\n",
      "Iteration: 885, Train loss: -0.9783, rewards: 0.7663\n",
      "Iteration: 890, Train loss: -0.9936, rewards: 0.7496\n",
      "Iteration: 895, Train loss: -1.0575, rewards: 0.7040\n",
      "Iteration: 900, Train loss: -1.0681, rewards: 0.7342\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7595\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -1.0540, rewards: 0.7224\n",
      "Iteration: 910, Train loss: -1.0091, rewards: 0.7168\n",
      "Iteration: 915, Train loss: -0.9633, rewards: 0.7639\n",
      "Iteration: 920, Train loss: -0.9029, rewards: 0.7949\n",
      "Iteration: 925, Train loss: -1.0459, rewards: 0.7349\n",
      "Iteration: 930, Train loss: -0.8943, rewards: 0.7474\n",
      "Iteration: 935, Train loss: -1.0129, rewards: 0.7106\n",
      "Iteration: 940, Train loss: -0.9602, rewards: 0.7515\n",
      "Iteration: 945, Train loss: -1.0386, rewards: 0.7260\n",
      "Iteration: 950, Train loss: -1.0078, rewards: 0.7461\n",
      "Eval:\n",
      "Hits@1: 0.7164, Hits@3: 0.7861, Hits@10: 0.7960, MRR: 0.7535\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -0.8612, rewards: 0.7632\n",
      "Iteration: 960, Train loss: -0.9978, rewards: 0.7489\n",
      "Iteration: 965, Train loss: -0.9587, rewards: 0.7348\n",
      "Iteration: 970, Train loss: -0.9220, rewards: 0.7511\n",
      "Iteration: 975, Train loss: -0.9487, rewards: 0.7651\n",
      "Iteration: 980, Train loss: -0.9747, rewards: 0.7580\n",
      "Iteration: 985, Train loss: -0.9744, rewards: 0.7371\n",
      "Iteration: 990, Train loss: -0.9341, rewards: 0.7588\n",
      "Iteration: 995, Train loss: -0.8610, rewards: 0.7574\n",
      "Iteration: 1000, Train loss: -0.9864, rewards: 0.7899\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7681\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -1.0538, rewards: 0.7365\n",
      "Iteration: 1010, Train loss: -1.0195, rewards: 0.7275\n",
      "Iteration: 1015, Train loss: -0.9751, rewards: 0.7189\n",
      "Iteration: 1020, Train loss: -0.9255, rewards: 0.7567\n",
      "Iteration: 1025, Train loss: -1.0048, rewards: 0.7498\n",
      "Iteration: 1030, Train loss: -0.9696, rewards: 0.7371\n",
      "Iteration: 1035, Train loss: -0.9877, rewards: 0.7217\n",
      "Iteration: 1040, Train loss: -1.0179, rewards: 0.7473\n",
      "Iteration: 1045, Train loss: -0.9246, rewards: 0.7904\n",
      "Iteration: 1050, Train loss: -0.8488, rewards: 0.7971\n",
      "Eval:\n",
      "Hits@1: 0.7612, Hits@3: 0.7861, Hits@10: 0.7960, MRR: 0.7754\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -0.8765, rewards: 0.7554\n",
      "Iteration: 1060, Train loss: -0.9423, rewards: 0.7180\n",
      "Iteration: 1065, Train loss: -0.9960, rewards: 0.7354\n",
      "Iteration: 1070, Train loss: -0.8738, rewards: 0.7896\n",
      "Iteration: 1075, Train loss: -0.9424, rewards: 0.7712\n",
      "Iteration: 1080, Train loss: -1.0027, rewards: 0.7469\n",
      "Iteration: 1085, Train loss: -1.0427, rewards: 0.7212\n",
      "Iteration: 1090, Train loss: -1.0349, rewards: 0.7333\n",
      "Iteration: 1095, Train loss: -0.9520, rewards: 0.7451\n",
      "Iteration: 1100, Train loss: -0.8693, rewards: 0.7850\n",
      "Eval:\n",
      "Hits@1: 0.7562, Hits@3: 0.7861, Hits@10: 0.7960, MRR: 0.7726\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -1.0197, rewards: 0.7358\n",
      "Iteration: 1110, Train loss: -0.9589, rewards: 0.7436\n",
      "Iteration: 1115, Train loss: -0.9801, rewards: 0.7414\n",
      "Iteration: 1120, Train loss: -1.0067, rewards: 0.7620\n",
      "Iteration: 1125, Train loss: -0.9866, rewards: 0.7208\n",
      "Iteration: 1130, Train loss: -1.0375, rewards: 0.7327\n",
      "Iteration: 1135, Train loss: -0.9463, rewards: 0.7405\n",
      "Iteration: 1140, Train loss: -0.9270, rewards: 0.7713\n",
      "Iteration: 1145, Train loss: -1.0142, rewards: 0.7548\n",
      "Iteration: 1150, Train loss: -0.9799, rewards: 0.7260\n",
      "Eval:\n",
      "Hits@1: 0.7512, Hits@3: 0.7861, Hits@10: 0.7960, MRR: 0.7704\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -1.0705, rewards: 0.6774\n",
      "Iteration: 1160, Train loss: -0.9784, rewards: 0.7348\n",
      "Iteration: 1165, Train loss: -1.0257, rewards: 0.7299\n",
      "Iteration: 1170, Train loss: -0.9311, rewards: 0.7650\n",
      "Iteration: 1175, Train loss: -0.9680, rewards: 0.7231\n",
      "Iteration: 1180, Train loss: -0.9772, rewards: 0.7540\n",
      "Iteration: 1185, Train loss: -0.8996, rewards: 0.7652\n",
      "Iteration: 1190, Train loss: -0.8667, rewards: 0.7904\n",
      "Iteration: 1195, Train loss: -0.9463, rewards: 0.7455\n",
      "Iteration: 1200, Train loss: -0.9094, rewards: 0.7757\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7462\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -1.0089, rewards: 0.7595\n",
      "Iteration: 1210, Train loss: -0.9951, rewards: 0.7255\n",
      "Iteration: 1215, Train loss: -0.9359, rewards: 0.7760\n",
      "Iteration: 1220, Train loss: -0.9946, rewards: 0.7258\n",
      "Iteration: 1225, Train loss: -0.9583, rewards: 0.7380\n",
      "Iteration: 1230, Train loss: -0.9911, rewards: 0.7400\n",
      "Iteration: 1235, Train loss: -0.9179, rewards: 0.7614\n",
      "Iteration: 1240, Train loss: -1.0122, rewards: 0.7479\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -1.0044, rewards: 0.7330\n",
      "Iteration: 1250, Train loss: -0.9286, rewards: 0.7352\n",
      "Eval:\n",
      "Hits@1: 0.7363, Hits@3: 0.7861, Hits@10: 0.8060, MRR: 0.7646\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -0.9941, rewards: 0.7382\n",
      "Iteration: 1260, Train loss: -0.9383, rewards: 0.7690\n",
      "Iteration: 1265, Train loss: -0.9474, rewards: 0.7667\n",
      "Iteration: 1270, Train loss: -0.9527, rewards: 0.7421\n",
      "Iteration: 1275, Train loss: -0.9033, rewards: 0.7921\n",
      "Iteration: 1280, Train loss: -1.0000, rewards: 0.7212\n",
      "Iteration: 1285, Train loss: -1.0107, rewards: 0.7263\n",
      "Iteration: 1290, Train loss: -0.9888, rewards: 0.7189\n",
      "Iteration: 1295, Train loss: -0.9737, rewards: 0.7473\n",
      "Iteration: 1300, Train loss: -0.8307, rewards: 0.8014\n",
      "Eval:\n",
      "Hits@1: 0.7114, Hits@3: 0.7861, Hits@10: 0.8060, MRR: 0.7516\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -0.8534, rewards: 0.8049\n",
      "Iteration: 1310, Train loss: -1.0057, rewards: 0.7398\n",
      "Iteration: 1315, Train loss: -0.9852, rewards: 0.7331\n",
      "Iteration: 1320, Train loss: -1.0099, rewards: 0.7595\n",
      "Iteration: 1325, Train loss: -1.0040, rewards: 0.7664\n",
      "Iteration: 1330, Train loss: -0.9416, rewards: 0.7520\n",
      "Iteration: 1335, Train loss: -0.9834, rewards: 0.7429\n",
      "Iteration: 1340, Train loss: -1.0153, rewards: 0.7480\n",
      "Iteration: 1345, Train loss: -0.9605, rewards: 0.7564\n",
      "Iteration: 1350, Train loss: -0.8118, rewards: 0.7482\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7811, Hits@10: 0.7910, MRR: 0.7669\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -0.8885, rewards: 0.7550\n",
      "Iteration: 1360, Train loss: -0.9616, rewards: 0.7361\n",
      "Iteration: 1365, Train loss: -1.0421, rewards: 0.6992\n",
      "Iteration: 1370, Train loss: -0.9079, rewards: 0.7446\n",
      "Iteration: 1375, Train loss: -0.9139, rewards: 0.7554\n",
      "Iteration: 1380, Train loss: -0.8582, rewards: 0.7308\n",
      "Iteration: 1385, Train loss: -1.0319, rewards: 0.7157\n",
      "Iteration: 1390, Train loss: -0.9018, rewards: 0.7492\n",
      "Iteration: 1395, Train loss: -0.9451, rewards: 0.7196\n",
      "Iteration: 1400, Train loss: -0.9022, rewards: 0.7448\n",
      "Eval:\n",
      "Hits@1: 0.7363, Hits@3: 0.7861, Hits@10: 0.7910, MRR: 0.7617\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -0.9162, rewards: 0.7626\n",
      "Iteration: 1410, Train loss: -1.0036, rewards: 0.7267\n",
      "Iteration: 1415, Train loss: -0.9795, rewards: 0.7715\n",
      "Iteration: 1420, Train loss: -0.8610, rewards: 0.7882\n",
      "Iteration: 1425, Train loss: -1.0181, rewards: 0.6989\n",
      "Iteration: 1430, Train loss: -1.0324, rewards: 0.7435\n",
      "Iteration: 1435, Train loss: -0.9713, rewards: 0.7640\n",
      "Iteration: 1440, Train loss: -0.9603, rewards: 0.7471\n",
      "Iteration: 1445, Train loss: -0.8598, rewards: 0.7430\n",
      "Iteration: 1450, Train loss: -0.9053, rewards: 0.7533\n",
      "Eval:\n",
      "Hits@1: 0.7164, Hits@3: 0.7861, Hits@10: 0.7861, MRR: 0.7512\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -0.9665, rewards: 0.7781\n",
      "Iteration: 1460, Train loss: -0.9339, rewards: 0.7425\n",
      "Iteration: 1465, Train loss: -1.0095, rewards: 0.7167\n",
      "Iteration: 1470, Train loss: -0.8691, rewards: 0.7520\n",
      "Iteration: 1475, Train loss: -0.7987, rewards: 0.7561\n",
      "Iteration: 1480, Train loss: -0.8842, rewards: 0.7411\n",
      "Iteration: 1485, Train loss: -0.9278, rewards: 0.6915\n",
      "Iteration: 1490, Train loss: -0.9409, rewards: 0.7439\n",
      "Iteration: 1495, Train loss: -0.9803, rewards: 0.7726\n",
      "Iteration: 1500, Train loss: -0.9930, rewards: 0.7349\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7861, Hits@10: 0.8010, MRR: 0.7597\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -0.8964, rewards: 0.7457\n",
      "Iteration: 1510, Train loss: -0.9837, rewards: 0.7252\n",
      "Iteration: 1515, Train loss: -1.0814, rewards: 0.6911\n",
      "Iteration: 1520, Train loss: -0.9275, rewards: 0.7117\n",
      "Iteration: 1525, Train loss: -1.0034, rewards: 0.7154\n",
      "Iteration: 1530, Train loss: -0.8974, rewards: 0.7111\n",
      "Iteration: 1535, Train loss: -0.9978, rewards: 0.7157\n",
      "Iteration: 1540, Train loss: -0.9229, rewards: 0.7346\n",
      "Iteration: 1545, Train loss: -0.8502, rewards: 0.7744\n",
      "Iteration: 1550, Train loss: -0.9408, rewards: 0.7310\n",
      "Eval:\n",
      "Hits@1: 0.7114, Hits@3: 0.7761, Hits@10: 0.7861, MRR: 0.7452\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.8754, rewards: 0.7429\n",
      "Iteration: 1560, Train loss: -1.0121, rewards: 0.6949\n",
      "Iteration: 1565, Train loss: -0.9878, rewards: 0.7118\n",
      "Iteration: 1570, Train loss: -0.9200, rewards: 0.7518\n",
      "Iteration: 1575, Train loss: -1.0274, rewards: 0.7001\n",
      "Iteration: 1580, Train loss: -0.9708, rewards: 0.7571\n",
      "Iteration: 1585, Train loss: -0.9959, rewards: 0.7357\n",
      "Iteration: 1590, Train loss: -0.8810, rewards: 0.7281\n",
      "Iteration: 1595, Train loss: -0.9474, rewards: 0.7067\n",
      "Iteration: 1600, Train loss: -1.0315, rewards: 0.7229\n",
      "Eval:\n",
      "Hits@1: 0.7363, Hits@3: 0.7811, Hits@10: 0.8109, MRR: 0.7637\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.9208, rewards: 0.7395\n",
      "Iteration: 1610, Train loss: -0.7928, rewards: 0.7268\n",
      "Iteration: 1615, Train loss: -0.6211, rewards: 0.7443\n",
      "Iteration: 1620, Train loss: -0.5826, rewards: 0.6865\n",
      "Iteration: 1625, Train loss: -0.8661, rewards: 0.7433\n",
      "Iteration: 1630, Train loss: -1.0406, rewards: 0.6811\n",
      "Iteration: 1635, Train loss: -0.9609, rewards: 0.7458\n",
      "Iteration: 1640, Train loss: -0.9120, rewards: 0.7799\n",
      "Iteration: 1645, Train loss: -0.9742, rewards: 0.7601\n",
      "Iteration: 1650, Train loss: -0.8950, rewards: 0.7756\n",
      "Eval:\n",
      "Hits@1: 0.7413, Hits@3: 0.7861, Hits@10: 0.8010, MRR: 0.7667\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -0.7697, rewards: 0.7513\n",
      "Iteration: 1660, Train loss: -0.8844, rewards: 0.7665\n",
      "Iteration: 1665, Train loss: -1.0460, rewards: 0.7218\n",
      "Iteration: 1670, Train loss: -1.0110, rewards: 0.7425\n",
      "Iteration: 1675, Train loss: -0.8649, rewards: 0.7692\n",
      "Iteration: 1680, Train loss: -0.8569, rewards: 0.7452\n",
      "Iteration: 1685, Train loss: -0.8084, rewards: 0.7563\n",
      "Iteration: 1690, Train loss: -0.9112, rewards: 0.7521\n",
      "Iteration: 1695, Train loss: -0.9239, rewards: 0.7290\n",
      "Iteration: 1700, Train loss: -0.9530, rewards: 0.7168\n",
      "Eval:\n",
      "Hits@1: 0.7264, Hits@3: 0.7811, Hits@10: 0.8060, MRR: 0.7584\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -0.9686, rewards: 0.7337\n",
      "Iteration: 1710, Train loss: -0.9849, rewards: 0.7490\n",
      "Iteration: 1715, Train loss: -1.0778, rewards: 0.7012\n",
      "Iteration: 1720, Train loss: -1.1072, rewards: 0.7108\n",
      "Iteration: 1725, Train loss: -0.9669, rewards: 0.7569\n",
      "Iteration: 1730, Train loss: -0.8571, rewards: 0.7594\n",
      "Iteration: 1735, Train loss: -0.9513, rewards: 0.7450\n",
      "Iteration: 1740, Train loss: -0.8883, rewards: 0.7633\n",
      "Iteration: 1745, Train loss: -1.0147, rewards: 0.7392\n",
      "Iteration: 1750, Train loss: -1.0044, rewards: 0.7352\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7811, Hits@10: 0.8060, MRR: 0.7476\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.9105, rewards: 0.7582\n",
      "Iteration: 1760, Train loss: -0.9755, rewards: 0.7699\n",
      "Iteration: 1765, Train loss: -0.9077, rewards: 0.7500\n",
      "Iteration: 1770, Train loss: -0.9390, rewards: 0.7567\n",
      "Iteration: 1775, Train loss: -0.9343, rewards: 0.7357\n",
      "Iteration: 1780, Train loss: -1.0135, rewards: 0.7249\n",
      "Iteration: 1785, Train loss: -0.8931, rewards: 0.7493\n",
      "Iteration: 1790, Train loss: -1.0349, rewards: 0.7332\n",
      "Iteration: 1795, Train loss: -0.9872, rewards: 0.7590\n",
      "Iteration: 1800, Train loss: -0.9318, rewards: 0.7748\n",
      "Eval:\n",
      "Hits@1: 0.7413, Hits@3: 0.7811, Hits@10: 0.7861, MRR: 0.7618\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -1.0071, rewards: 0.7094\n",
      "Iteration: 1810, Train loss: -0.9526, rewards: 0.7707\n",
      "Iteration: 1815, Train loss: -0.9610, rewards: 0.7399\n",
      "Iteration: 1820, Train loss: -0.9664, rewards: 0.7587\n",
      "Iteration: 1825, Train loss: -0.9169, rewards: 0.7223\n",
      "Iteration: 1830, Train loss: -0.8309, rewards: 0.7902\n",
      "Iteration: 1835, Train loss: -0.9780, rewards: 0.7335\n",
      "Iteration: 1840, Train loss: -0.9136, rewards: 0.7543\n",
      "Iteration: 1845, Train loss: -0.9314, rewards: 0.7454\n",
      "Iteration: 1850, Train loss: -0.9034, rewards: 0.7392\n",
      "Eval:\n",
      "Hits@1: 0.7512, Hits@3: 0.7811, Hits@10: 0.7861, MRR: 0.7667\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -0.8987, rewards: 0.7581\n",
      "Iteration: 1860, Train loss: -0.9918, rewards: 0.7168\n",
      "Iteration: 1865, Train loss: -1.0094, rewards: 0.7261\n",
      "Iteration: 1870, Train loss: -0.9537, rewards: 0.7358\n",
      "Iteration: 1875, Train loss: -0.8844, rewards: 0.7607\n",
      "Iteration: 1880, Train loss: -0.8898, rewards: 0.7712\n",
      "Iteration: 1885, Train loss: -0.9633, rewards: 0.7395\n",
      "Iteration: 1890, Train loss: -0.9572, rewards: 0.7317\n",
      "Iteration: 1895, Train loss: -0.9640, rewards: 0.7119\n",
      "Iteration: 1900, Train loss: -1.0266, rewards: 0.7210\n",
      "Eval:\n",
      "Hits@1: 0.6517, Hits@3: 0.7811, Hits@10: 0.7861, MRR: 0.7170\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -0.9437, rewards: 0.7365\n",
      "Iteration: 1910, Train loss: -1.0084, rewards: 0.7454\n",
      "Iteration: 1915, Train loss: -1.0219, rewards: 0.7351\n",
      "Iteration: 1920, Train loss: -0.7877, rewards: 0.7252\n",
      "Iteration: 1925, Train loss: -0.9336, rewards: 0.7188\n",
      "Iteration: 1930, Train loss: -0.9577, rewards: 0.7421\n",
      "Iteration: 1935, Train loss: -1.1104, rewards: 0.6455\n",
      "Iteration: 1940, Train loss: -1.1178, rewards: 0.1833\n",
      "Iteration: 1945, Train loss: -0.9140, rewards: 0.3236\n",
      "Iteration: 1950, Train loss: -0.5896, rewards: 0.6924\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7811, Hits@10: 0.7910, MRR: 0.7465\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -0.7237, rewards: 0.6937\n",
      "Iteration: 1960, Train loss: -0.6456, rewards: 0.7013\n",
      "Iteration: 1965, Train loss: -0.6104, rewards: 0.6642\n",
      "Iteration: 1970, Train loss: -0.6423, rewards: 0.6939\n",
      "Iteration: 1975, Train loss: -0.6196, rewards: 0.7361\n",
      "Iteration: 1980, Train loss: -0.5215, rewards: 0.7690\n",
      "Iteration: 1985, Train loss: -0.6227, rewards: 0.7343\n",
      "Iteration: 1990, Train loss: -0.6671, rewards: 0.7387\n",
      "Iteration: 1995, Train loss: -0.7762, rewards: 0.6793\n",
      "Iteration: 2000, Train loss: -0.7508, rewards: 0.7212\n",
      "Eval:\n",
      "Hits@1: 0.7214, Hits@3: 0.7711, Hits@10: 0.8010, MRR: 0.7485\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/athletehomestadium//test_beam/ ]\n",
      "Hits@1: 0.6915, Hits@3: 0.7413, Hits@10: 0.8010, MRR: 0.7247\n",
      "AthleteHomeStadium\n",
      "MINERVA MAP: 0.8571785732233493 (201 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 22:25:45,644]\u001b[0m Trial 1 finished with value: 0.8571785732233493 and parameters: {'lr': 0.0006961326739169526, 'bs': 84, 'b': 0.24980966352985412, 'l': 0.1586574991581901, 'ee': 50}. Best is trial 0 with value: 0.8576843416395655.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.2270, rewards: 0.1526\n",
      "Iteration: 20, Train loss: -0.2116, rewards: 0.6513\n",
      "Iteration: 30, Train loss: -0.1322, rewards: 0.6336\n",
      "Iteration: 40, Train loss: -0.0450, rewards: 0.7087\n",
      "Iteration: 50, Train loss: -0.0171, rewards: 0.6673\n",
      "Iteration: 60, Train loss: -0.0181, rewards: 0.6841\n",
      "Iteration: 70, Train loss: -0.0161, rewards: 0.6929\n",
      "Iteration: 80, Train loss: -0.0189, rewards: 0.6589\n",
      "Iteration: 90, Train loss: -0.0168, rewards: 0.6330\n",
      "Iteration: 100, Train loss: -0.0425, rewards: 0.6274\n",
      "Eval:\n",
      "Hits@1: 0.6716, Hits@3: 0.6766, Hits@10: 0.7015, MRR: 0.6789\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.0221, rewards: 0.5842\n",
      "Iteration: 120, Train loss: -0.0368, rewards: 0.6034\n",
      "Iteration: 130, Train loss: -0.0314, rewards: 0.6395\n",
      "Iteration: 140, Train loss: -0.0145, rewards: 0.7007\n",
      "Iteration: 150, Train loss: -0.0179, rewards: 0.6716\n",
      "Iteration: 160, Train loss: -0.0169, rewards: 0.6514\n",
      "Iteration: 170, Train loss: -0.0138, rewards: 0.6737\n",
      "Iteration: 180, Train loss: -0.0109, rewards: 0.6623\n",
      "Iteration: 190, Train loss: -0.0183, rewards: 0.6647\n",
      "Iteration: 200, Train loss: -0.0090, rewards: 0.6639\n",
      "Eval:\n",
      "Hits@1: 0.6716, Hits@3: 0.7065, Hits@10: 0.7164, MRR: 0.6874\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.0132, rewards: 0.6474\n",
      "Iteration: 220, Train loss: -0.0166, rewards: 0.6679\n",
      "Iteration: 230, Train loss: -0.0165, rewards: 0.6821\n",
      "Iteration: 240, Train loss: -0.0065, rewards: 0.6905\n",
      "Iteration: 250, Train loss: -0.0154, rewards: 0.6733\n",
      "Iteration: 260, Train loss: -0.0163, rewards: 0.6916\n",
      "Iteration: 270, Train loss: -0.0088, rewards: 0.6558\n",
      "Iteration: 280, Train loss: -0.0119, rewards: 0.6623\n",
      "Iteration: 290, Train loss: -0.0091, rewards: 0.6737\n",
      "Iteration: 300, Train loss: -0.0135, rewards: 0.7042\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7142\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.0108, rewards: 0.6843\n",
      "Iteration: 320, Train loss: -0.0122, rewards: 0.6758\n",
      "Iteration: 330, Train loss: -0.0122, rewards: 0.6705\n",
      "Iteration: 340, Train loss: -0.0137, rewards: 0.6842\n",
      "Iteration: 350, Train loss: -0.0098, rewards: 0.6621\n",
      "Iteration: 360, Train loss: -0.0139, rewards: 0.6895\n",
      "Iteration: 370, Train loss: -0.0102, rewards: 0.6589\n",
      "Iteration: 380, Train loss: -0.0059, rewards: 0.6895\n",
      "Iteration: 390, Train loss: -0.0106, rewards: 0.6947\n",
      "Iteration: 400, Train loss: -0.0134, rewards: 0.6937\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.0146, rewards: 0.7011\n",
      "Iteration: 420, Train loss: -0.0182, rewards: 0.7021\n",
      "Iteration: 430, Train loss: -0.0085, rewards: 0.6758\n",
      "Iteration: 440, Train loss: -0.0210, rewards: 0.6789\n",
      "Iteration: 450, Train loss: -0.0121, rewards: 0.6853\n",
      "Iteration: 460, Train loss: -0.0149, rewards: 0.6895\n",
      "Iteration: 470, Train loss: -0.0195, rewards: 0.6947\n",
      "Iteration: 480, Train loss: -0.0126, rewards: 0.6779\n",
      "Iteration: 490, Train loss: -0.0148, rewards: 0.7011\n",
      "Iteration: 500, Train loss: -0.0122, rewards: 0.6600\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.0170, rewards: 0.7011\n",
      "Iteration: 520, Train loss: -0.0115, rewards: 0.6789\n",
      "Iteration: 530, Train loss: -0.0130, rewards: 0.6874\n",
      "Iteration: 540, Train loss: -0.0144, rewards: 0.6768\n",
      "Iteration: 550, Train loss: -0.0135, rewards: 0.6653\n",
      "Iteration: 560, Train loss: -0.0171, rewards: 0.6926\n",
      "Iteration: 570, Train loss: -0.0087, rewards: 0.6926\n",
      "Iteration: 580, Train loss: -0.0171, rewards: 0.6800\n",
      "Iteration: 590, Train loss: -0.0123, rewards: 0.6916\n",
      "Iteration: 600, Train loss: -0.0119, rewards: 0.7021\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.0154, rewards: 0.6874\n",
      "Iteration: 620, Train loss: -0.0093, rewards: 0.6853\n",
      "Iteration: 630, Train loss: -0.0173, rewards: 0.6958\n",
      "Iteration: 640, Train loss: -0.0149, rewards: 0.6611\n",
      "Iteration: 650, Train loss: -0.0085, rewards: 0.6779\n",
      "Iteration: 660, Train loss: -0.0162, rewards: 0.7021\n",
      "Iteration: 670, Train loss: -0.0167, rewards: 0.6905\n",
      "Iteration: 680, Train loss: -0.0067, rewards: 0.6589\n",
      "Iteration: 690, Train loss: -0.0104, rewards: 0.6526\n",
      "Iteration: 700, Train loss: -0.0136, rewards: 0.6832\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.0125, rewards: 0.7137\n",
      "Iteration: 720, Train loss: -0.0137, rewards: 0.6547\n",
      "Iteration: 730, Train loss: -0.0115, rewards: 0.6958\n",
      "Iteration: 740, Train loss: -0.0114, rewards: 0.6516\n",
      "Iteration: 750, Train loss: -0.0129, rewards: 0.6737\n",
      "Iteration: 760, Train loss: -0.0148, rewards: 0.6695\n",
      "Iteration: 770, Train loss: -0.0097, rewards: 0.6779\n",
      "Iteration: 780, Train loss: -0.0193, rewards: 0.6726\n",
      "Iteration: 790, Train loss: -0.0181, rewards: 0.6474\n",
      "Iteration: 800, Train loss: -0.0133, rewards: 0.6884\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -0.0108, rewards: 0.6442\n",
      "Iteration: 820, Train loss: -0.0148, rewards: 0.6737\n",
      "Iteration: 830, Train loss: -0.0156, rewards: 0.6968\n",
      "Iteration: 840, Train loss: -0.0130, rewards: 0.6968\n",
      "Iteration: 850, Train loss: -0.0074, rewards: 0.6853\n",
      "Iteration: 860, Train loss: -0.0123, rewards: 0.6884\n",
      "Iteration: 870, Train loss: -0.0192, rewards: 0.7011\n",
      "Iteration: 880, Train loss: -0.0115, rewards: 0.6537\n",
      "Iteration: 890, Train loss: -0.0106, rewards: 0.6747\n",
      "Iteration: 900, Train loss: -0.0109, rewards: 0.6832\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.0051, rewards: 0.6737\n",
      "Iteration: 920, Train loss: -0.0169, rewards: 0.6379\n",
      "Iteration: 930, Train loss: -0.0150, rewards: 0.6937\n",
      "Iteration: 940, Train loss: -0.0157, rewards: 0.6768\n",
      "Iteration: 950, Train loss: -0.0122, rewards: 0.6958\n",
      "Iteration: 960, Train loss: -0.0125, rewards: 0.6537\n",
      "Iteration: 970, Train loss: -0.0144, rewards: 0.6821\n",
      "Iteration: 980, Train loss: -0.0133, rewards: 0.6842\n",
      "Iteration: 990, Train loss: -0.0144, rewards: 0.6684\n",
      "Iteration: 1000, Train loss: -0.0061, rewards: 0.6926\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.0112, rewards: 0.7011\n",
      "Iteration: 1020, Train loss: -0.0097, rewards: 0.6853\n",
      "Iteration: 1030, Train loss: -0.0128, rewards: 0.6779\n",
      "Iteration: 1040, Train loss: -0.0173, rewards: 0.6821\n",
      "Iteration: 1050, Train loss: -0.0231, rewards: 0.6789\n",
      "Iteration: 1060, Train loss: -0.0109, rewards: 0.6811\n",
      "Iteration: 1070, Train loss: -0.0125, rewards: 0.6811\n",
      "Iteration: 1080, Train loss: -0.0046, rewards: 0.6863\n",
      "Iteration: 1090, Train loss: -0.0175, rewards: 0.6758\n",
      "Iteration: 1100, Train loss: -0.0154, rewards: 0.6779\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.0134, rewards: 0.6958\n",
      "Iteration: 1120, Train loss: -0.0194, rewards: 0.7063\n",
      "Iteration: 1130, Train loss: -0.0125, rewards: 0.6853\n",
      "Iteration: 1140, Train loss: -0.0104, rewards: 0.6726\n",
      "Iteration: 1150, Train loss: -0.0136, rewards: 0.6863\n",
      "Iteration: 1160, Train loss: -0.0089, rewards: 0.6779\n",
      "Iteration: 1170, Train loss: -0.0123, rewards: 0.6663\n",
      "Iteration: 1180, Train loss: -0.0152, rewards: 0.7021\n",
      "Iteration: 1190, Train loss: -0.0166, rewards: 0.6726\n",
      "Iteration: 1200, Train loss: -0.0127, rewards: 0.6832\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.0103, rewards: 0.6800\n",
      "Iteration: 1220, Train loss: -0.0094, rewards: 0.6958\n",
      "Iteration: 1230, Train loss: -0.0124, rewards: 0.6737\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.0181, rewards: 0.6653\n",
      "Iteration: 1250, Train loss: -0.0138, rewards: 0.6905\n",
      "Iteration: 1260, Train loss: -0.0104, rewards: 0.6811\n",
      "Iteration: 1270, Train loss: -0.0124, rewards: 0.6726\n",
      "Iteration: 1280, Train loss: -0.0107, rewards: 0.6926\n",
      "Iteration: 1290, Train loss: -0.0187, rewards: 0.6768\n",
      "Iteration: 1300, Train loss: -0.0245, rewards: 0.6674\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.0082, rewards: 0.6842\n",
      "Iteration: 1320, Train loss: -0.0102, rewards: 0.6747\n",
      "Iteration: 1330, Train loss: -0.0142, rewards: 0.6726\n",
      "Iteration: 1340, Train loss: -0.0118, rewards: 0.6863\n",
      "Iteration: 1350, Train loss: -0.0094, rewards: 0.6758\n",
      "Iteration: 1360, Train loss: -0.0112, rewards: 0.6905\n",
      "Iteration: 1370, Train loss: -0.0121, rewards: 0.6642\n",
      "Iteration: 1380, Train loss: -0.0207, rewards: 0.6905\n",
      "Iteration: 1390, Train loss: -0.0076, rewards: 0.6895\n",
      "Iteration: 1400, Train loss: -0.0155, rewards: 0.6821\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.0150, rewards: 0.7179\n",
      "Iteration: 1420, Train loss: -0.0106, rewards: 0.6874\n",
      "Iteration: 1430, Train loss: -0.0059, rewards: 0.6758\n",
      "Iteration: 1440, Train loss: -0.0065, rewards: 0.6779\n",
      "Iteration: 1450, Train loss: -0.0137, rewards: 0.6895\n",
      "Iteration: 1460, Train loss: -0.0136, rewards: 0.6716\n",
      "Iteration: 1470, Train loss: -0.0129, rewards: 0.6705\n",
      "Iteration: 1480, Train loss: -0.0154, rewards: 0.6789\n",
      "Iteration: 1490, Train loss: -0.0117, rewards: 0.6916\n",
      "Iteration: 1500, Train loss: -0.0094, rewards: 0.6947\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.0124, rewards: 0.6526\n",
      "Iteration: 1520, Train loss: -0.0112, rewards: 0.6937\n",
      "Iteration: 1530, Train loss: -0.0145, rewards: 0.6716\n",
      "Iteration: 1540, Train loss: -0.0056, rewards: 0.6979\n",
      "Iteration: 1550, Train loss: -0.0112, rewards: 0.6968\n",
      "Iteration: 1560, Train loss: -0.0105, rewards: 0.6611\n",
      "Iteration: 1570, Train loss: -0.0119, rewards: 0.6747\n",
      "Iteration: 1580, Train loss: -0.0116, rewards: 0.6695\n",
      "Iteration: 1590, Train loss: -0.0094, rewards: 0.6537\n",
      "Iteration: 1600, Train loss: -0.0110, rewards: 0.6874\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.0165, rewards: 0.6853\n",
      "Iteration: 1620, Train loss: -0.0077, rewards: 0.6968\n",
      "Iteration: 1630, Train loss: -0.0076, rewards: 0.6726\n",
      "Iteration: 1640, Train loss: -0.0041, rewards: 0.6979\n",
      "Iteration: 1650, Train loss: -0.0113, rewards: 0.6600\n",
      "Iteration: 1660, Train loss: -0.0161, rewards: 0.6863\n",
      "Iteration: 1670, Train loss: -0.0132, rewards: 0.6547\n",
      "Iteration: 1680, Train loss: -0.0117, rewards: 0.6884\n",
      "Iteration: 1690, Train loss: -0.0121, rewards: 0.7116\n",
      "Iteration: 1700, Train loss: -0.0160, rewards: 0.6811\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -0.0087, rewards: 0.6726\n",
      "Iteration: 1720, Train loss: -0.0193, rewards: 0.6821\n",
      "Iteration: 1730, Train loss: -0.0118, rewards: 0.7032\n",
      "Iteration: 1740, Train loss: -0.0129, rewards: 0.6800\n",
      "Iteration: 1750, Train loss: -0.0079, rewards: 0.6832\n",
      "Iteration: 1760, Train loss: -0.0105, rewards: 0.6789\n",
      "Iteration: 1770, Train loss: -0.0104, rewards: 0.6863\n",
      "Iteration: 1780, Train loss: -0.0099, rewards: 0.6558\n",
      "Iteration: 1790, Train loss: -0.0125, rewards: 0.6863\n",
      "Iteration: 1800, Train loss: -0.0106, rewards: 0.7105\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.0115, rewards: 0.6842\n",
      "Iteration: 1820, Train loss: -0.0140, rewards: 0.6895\n",
      "Iteration: 1830, Train loss: -0.0185, rewards: 0.6337\n",
      "Iteration: 1840, Train loss: -0.0157, rewards: 0.6716\n",
      "Iteration: 1850, Train loss: -0.0147, rewards: 0.6705\n",
      "Iteration: 1860, Train loss: -0.0168, rewards: 0.6579\n",
      "Iteration: 1870, Train loss: -0.0125, rewards: 0.6958\n",
      "Iteration: 1880, Train loss: -0.0144, rewards: 0.6716\n",
      "Iteration: 1890, Train loss: -0.0113, rewards: 0.6884\n",
      "Iteration: 1900, Train loss: -0.0129, rewards: 0.6811\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -0.0137, rewards: 0.6916\n",
      "Iteration: 1920, Train loss: -0.0072, rewards: 0.6695\n",
      "Iteration: 1930, Train loss: -0.0113, rewards: 0.6842\n",
      "Iteration: 1940, Train loss: -0.0111, rewards: 0.6695\n",
      "Iteration: 1950, Train loss: -0.0114, rewards: 0.6621\n",
      "Iteration: 1960, Train loss: -0.0130, rewards: 0.6989\n",
      "Iteration: 1970, Train loss: -0.0124, rewards: 0.6779\n",
      "Iteration: 1980, Train loss: -0.0169, rewards: 0.6853\n",
      "Iteration: 1990, Train loss: -0.0149, rewards: 0.6947\n",
      "Iteration: 2000, Train loss: -0.0166, rewards: 0.6716\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7164, Hits@10: 0.7264, MRR: 0.7133\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/athletehomestadium//test_beam/ ]\n",
      "Hits@1: 0.7463, Hits@3: 0.7711, Hits@10: 0.7711, MRR: 0.7585\n",
      "AthleteHomeStadium\n",
      "MINERVA MAP: 0.8590424500872261 (201 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 23:15:58,645]\u001b[0m Trial 2 finished with value: 0.8590424500872261 and parameters: {'lr': 0.009782512377197659, 'bs': 95, 'b': 0.20958043072342875, 'l': 0.3032490999883034, 'ee': 100}. Best is trial 2 with value: 0.8590424500872261.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.8591, rewards: 0.3905\n",
      "Iteration: 20, Train loss: -1.0692, rewards: 0.5372\n",
      "Iteration: 30, Train loss: -0.9592, rewards: 0.6311\n",
      "Iteration: 40, Train loss: -0.9017, rewards: 0.6906\n",
      "Iteration: 50, Train loss: -1.0107, rewards: 0.6620\n",
      "Iteration: 60, Train loss: -0.8272, rewards: 0.7138\n",
      "Iteration: 70, Train loss: -0.8636, rewards: 0.6679\n",
      "Iteration: 80, Train loss: -0.8110, rewards: 0.6959\n",
      "Iteration: 90, Train loss: -0.8621, rewards: 0.6889\n",
      "Iteration: 100, Train loss: -0.9611, rewards: 0.6520\n",
      "Eval:\n",
      "Hits@1: 0.3881, Hits@3: 0.6866, Hits@10: 0.7662, MRR: 0.5136\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.7718, rewards: 0.6949\n",
      "Iteration: 120, Train loss: -0.8185, rewards: 0.6794\n",
      "Iteration: 130, Train loss: -0.9383, rewards: 0.6766\n",
      "Iteration: 140, Train loss: -0.8641, rewards: 0.7009\n",
      "Iteration: 150, Train loss: -0.8782, rewards: 0.6881\n",
      "Iteration: 160, Train loss: -0.7849, rewards: 0.7111\n",
      "Iteration: 170, Train loss: -0.7910, rewards: 0.7072\n",
      "Iteration: 180, Train loss: -0.9673, rewards: 0.6644\n",
      "Iteration: 190, Train loss: -0.8649, rewards: 0.7298\n",
      "Iteration: 200, Train loss: -0.7047, rewards: 0.7291\n",
      "Eval:\n",
      "Hits@1: 0.3632, Hits@3: 0.6418, Hits@10: 0.7811, MRR: 0.4908\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.8039, rewards: 0.7184\n",
      "Iteration: 220, Train loss: -0.8237, rewards: 0.7149\n",
      "Iteration: 230, Train loss: -0.8741, rewards: 0.7337\n",
      "Iteration: 240, Train loss: -0.7002, rewards: 0.7486\n",
      "Iteration: 250, Train loss: -0.8589, rewards: 0.6927\n",
      "Iteration: 260, Train loss: -0.7820, rewards: 0.7284\n",
      "Iteration: 270, Train loss: -0.8410, rewards: 0.6971\n",
      "Iteration: 280, Train loss: -0.8582, rewards: 0.7113\n",
      "Iteration: 290, Train loss: -0.8148, rewards: 0.7256\n",
      "Iteration: 300, Train loss: -0.8142, rewards: 0.7082\n",
      "Eval:\n",
      "Hits@1: 0.4030, Hits@3: 0.6965, Hits@10: 0.7910, MRR: 0.5312\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.7729, rewards: 0.7230\n",
      "Iteration: 320, Train loss: -0.8600, rewards: 0.7078\n",
      "Iteration: 330, Train loss: -0.8171, rewards: 0.7405\n",
      "Iteration: 340, Train loss: -0.7594, rewards: 0.7671\n",
      "Iteration: 350, Train loss: -0.9317, rewards: 0.7299\n",
      "Iteration: 360, Train loss: -0.9013, rewards: 0.6943\n",
      "Iteration: 370, Train loss: -0.7915, rewards: 0.7511\n",
      "Iteration: 380, Train loss: -0.7550, rewards: 0.7754\n",
      "Iteration: 390, Train loss: -0.8699, rewards: 0.7177\n",
      "Iteration: 400, Train loss: -0.7520, rewards: 0.7617\n",
      "Eval:\n",
      "Hits@1: 0.5821, Hits@3: 0.7463, Hits@10: 0.7910, MRR: 0.6529\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.7196, rewards: 0.7491\n",
      "Iteration: 420, Train loss: -0.8403, rewards: 0.7389\n",
      "Iteration: 430, Train loss: -0.7225, rewards: 0.7354\n",
      "Iteration: 440, Train loss: -0.8855, rewards: 0.7695\n",
      "Iteration: 450, Train loss: -0.8570, rewards: 0.7469\n",
      "Iteration: 460, Train loss: -0.8239, rewards: 0.7552\n",
      "Iteration: 470, Train loss: -0.8375, rewards: 0.7593\n",
      "Iteration: 480, Train loss: -0.9323, rewards: 0.7099\n",
      "Iteration: 490, Train loss: -0.8553, rewards: 0.7361\n",
      "Iteration: 500, Train loss: -0.8535, rewards: 0.7214\n",
      "Eval:\n",
      "Hits@1: 0.6667, Hits@3: 0.7811, Hits@10: 0.8060, MRR: 0.7284\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.8167, rewards: 0.7526\n",
      "Iteration: 520, Train loss: -0.7913, rewards: 0.7411\n",
      "Iteration: 530, Train loss: -0.9431, rewards: 0.7385\n",
      "Iteration: 540, Train loss: -0.9562, rewards: 0.7433\n",
      "Iteration: 550, Train loss: -0.7437, rewards: 0.7729\n",
      "Iteration: 560, Train loss: -0.8150, rewards: 0.7243\n",
      "Iteration: 570, Train loss: -0.8771, rewards: 0.7454\n",
      "Iteration: 580, Train loss: -0.8755, rewards: 0.7276\n",
      "Iteration: 590, Train loss: -0.8953, rewards: 0.7240\n",
      "Iteration: 600, Train loss: -0.8795, rewards: 0.7317\n",
      "Eval:\n",
      "Hits@1: 0.7264, Hits@3: 0.7811, Hits@10: 0.8010, MRR: 0.7515\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.9353, rewards: 0.7487\n",
      "Iteration: 620, Train loss: -0.9270, rewards: 0.7393\n",
      "Iteration: 630, Train loss: -0.9097, rewards: 0.7054\n",
      "Iteration: 640, Train loss: -0.8918, rewards: 0.7559\n",
      "Iteration: 650, Train loss: -0.7819, rewards: 0.7769\n",
      "Iteration: 660, Train loss: -0.8688, rewards: 0.7624\n",
      "Iteration: 670, Train loss: -0.8993, rewards: 0.7455\n",
      "Iteration: 680, Train loss: -0.8511, rewards: 0.7400\n",
      "Iteration: 690, Train loss: -0.8817, rewards: 0.7529\n",
      "Iteration: 700, Train loss: -0.9200, rewards: 0.7095\n",
      "Eval:\n",
      "Hits@1: 0.7711, Hits@3: 0.7711, Hits@10: 0.8060, MRR: 0.7778\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.9089, rewards: 0.7490\n",
      "Iteration: 720, Train loss: -0.9104, rewards: 0.7301\n",
      "Iteration: 730, Train loss: -0.8885, rewards: 0.7553\n",
      "Iteration: 740, Train loss: -0.9847, rewards: 0.7204\n",
      "Iteration: 750, Train loss: -0.9168, rewards: 0.7316\n",
      "Iteration: 760, Train loss: -0.9660, rewards: 0.7241\n",
      "Iteration: 770, Train loss: -0.8667, rewards: 0.7664\n",
      "Iteration: 780, Train loss: -0.9627, rewards: 0.7049\n",
      "Iteration: 790, Train loss: -0.9424, rewards: 0.7226\n",
      "Iteration: 800, Train loss: -0.9573, rewards: 0.7501\n",
      "Eval:\n",
      "Hits@1: 0.6816, Hits@3: 0.7811, Hits@10: 0.7960, MRR: 0.7207\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -1.0078, rewards: 0.7126\n",
      "Iteration: 820, Train loss: -0.8993, rewards: 0.7431\n",
      "Iteration: 830, Train loss: -0.9134, rewards: 0.7494\n",
      "Iteration: 840, Train loss: -0.8914, rewards: 0.7422\n",
      "Iteration: 850, Train loss: -0.9528, rewards: 0.7512\n",
      "Iteration: 860, Train loss: -1.0018, rewards: 0.7319\n",
      "Iteration: 870, Train loss: -0.9849, rewards: 0.7224\n",
      "Iteration: 880, Train loss: -0.8642, rewards: 0.7586\n",
      "Iteration: 890, Train loss: -0.8331, rewards: 0.7622\n",
      "Iteration: 900, Train loss: -0.8900, rewards: 0.7377\n",
      "Eval:\n",
      "Hits@1: 0.7313, Hits@3: 0.7761, Hits@10: 0.7861, MRR: 0.7530\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.8873, rewards: 0.7494\n",
      "Iteration: 920, Train loss: -0.8985, rewards: 0.7360\n",
      "Iteration: 930, Train loss: -0.8071, rewards: 0.7614\n",
      "Iteration: 940, Train loss: -0.9097, rewards: 0.7685\n",
      "Iteration: 950, Train loss: -0.8883, rewards: 0.7554\n",
      "Iteration: 960, Train loss: -0.9657, rewards: 0.7429\n",
      "Iteration: 970, Train loss: -1.0019, rewards: 0.7066\n",
      "Iteration: 980, Train loss: -0.8848, rewards: 0.7430\n",
      "Iteration: 990, Train loss: -0.9465, rewards: 0.7439\n",
      "Iteration: 1000, Train loss: -0.9121, rewards: 0.7321\n",
      "Eval:\n",
      "Hits@1: 0.7612, Hits@3: 0.7761, Hits@10: 0.7761, MRR: 0.7687\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.9289, rewards: 0.7254\n",
      "Iteration: 1020, Train loss: -0.9222, rewards: 0.7306\n",
      "Iteration: 1030, Train loss: -0.8714, rewards: 0.6769\n",
      "Iteration: 1040, Train loss: -0.8688, rewards: 0.6772\n",
      "Iteration: 1050, Train loss: -0.8781, rewards: 0.7255\n",
      "Iteration: 1060, Train loss: -0.8748, rewards: 0.7154\n",
      "Iteration: 1070, Train loss: -0.9490, rewards: 0.6711\n",
      "Iteration: 1080, Train loss: -0.9055, rewards: 0.6949\n",
      "Iteration: 1090, Train loss: -0.9958, rewards: 0.6711\n",
      "Iteration: 1100, Train loss: -0.9456, rewards: 0.6709\n",
      "Eval:\n",
      "Hits@1: 0.7164, Hits@3: 0.7662, Hits@10: 0.7861, MRR: 0.7436\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.9125, rewards: 0.6706\n",
      "Iteration: 1120, Train loss: -1.1788, rewards: 0.4541\n",
      "Iteration: 1130, Train loss: -0.9155, rewards: 0.6120\n",
      "Iteration: 1140, Train loss: -0.6434, rewards: 0.7244\n",
      "Iteration: 1150, Train loss: -0.6602, rewards: 0.7086\n",
      "Iteration: 1160, Train loss: -0.8195, rewards: 0.7202\n",
      "Iteration: 1170, Train loss: -0.7793, rewards: 0.7331\n",
      "Iteration: 1180, Train loss: -0.7766, rewards: 0.7292\n",
      "Iteration: 1190, Train loss: -0.8577, rewards: 0.7019\n",
      "Iteration: 1200, Train loss: -0.6570, rewards: 0.7404\n",
      "Eval:\n",
      "Hits@1: 0.7413, Hits@3: 0.7761, Hits@10: 0.7811, MRR: 0.7561\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.8378, rewards: 0.7156\n",
      "Iteration: 1220, Train loss: -0.7461, rewards: 0.7282\n",
      "Iteration: 1230, Train loss: -0.6857, rewards: 0.7588\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.7388, rewards: 0.7554\n",
      "Iteration: 1250, Train loss: -0.7566, rewards: 0.7300\n",
      "Iteration: 1260, Train loss: -0.7643, rewards: 0.7299\n",
      "Iteration: 1270, Train loss: -0.8228, rewards: 0.7301\n",
      "Iteration: 1280, Train loss: -0.8702, rewards: 0.7205\n",
      "Iteration: 1290, Train loss: -0.7078, rewards: 0.7157\n",
      "Iteration: 1300, Train loss: -0.9095, rewards: 0.7116\n",
      "Eval:\n",
      "Hits@1: 0.7512, Hits@3: 0.7761, Hits@10: 0.7861, MRR: 0.7626\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.7364, rewards: 0.7609\n",
      "Iteration: 1320, Train loss: -0.7839, rewards: 0.7192\n",
      "Iteration: 1330, Train loss: -0.8327, rewards: 0.7084\n",
      "Iteration: 1340, Train loss: -0.8435, rewards: 0.7456\n",
      "Iteration: 1350, Train loss: -0.7749, rewards: 0.7516\n",
      "Iteration: 1360, Train loss: -0.8061, rewards: 0.7153\n",
      "Iteration: 1370, Train loss: -0.8136, rewards: 0.7354\n",
      "Iteration: 1380, Train loss: -0.7417, rewards: 0.7480\n",
      "Iteration: 1390, Train loss: -0.7853, rewards: 0.7371\n",
      "Iteration: 1400, Train loss: -0.8217, rewards: 0.7338\n",
      "Eval:\n",
      "Hits@1: 0.7612, Hits@3: 0.7761, Hits@10: 0.8060, MRR: 0.7730\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.8495, rewards: 0.7058\n",
      "Iteration: 1420, Train loss: -0.9364, rewards: 0.7078\n",
      "Iteration: 1430, Train loss: -0.8243, rewards: 0.7246\n",
      "Iteration: 1440, Train loss: -0.8060, rewards: 0.7396\n",
      "Iteration: 1450, Train loss: -0.7480, rewards: 0.7476\n",
      "Iteration: 1460, Train loss: -0.7891, rewards: 0.7512\n",
      "Iteration: 1470, Train loss: -0.7793, rewards: 0.7571\n",
      "Iteration: 1480, Train loss: -0.7332, rewards: 0.7699\n",
      "Iteration: 1490, Train loss: -0.8177, rewards: 0.7624\n",
      "Iteration: 1500, Train loss: -0.8606, rewards: 0.7260\n",
      "Eval:\n",
      "Hits@1: 0.7463, Hits@3: 0.7761, Hits@10: 0.8159, MRR: 0.7662\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.7890, rewards: 0.7246\n",
      "Iteration: 1520, Train loss: -0.7838, rewards: 0.7401\n",
      "Iteration: 1530, Train loss: -0.7850, rewards: 0.7231\n",
      "Iteration: 1540, Train loss: -0.7982, rewards: 0.7321\n",
      "Iteration: 1550, Train loss: -0.7992, rewards: 0.7346\n",
      "Iteration: 1560, Train loss: -0.7851, rewards: 0.7256\n",
      "Iteration: 1570, Train loss: -0.8024, rewards: 0.7462\n",
      "Iteration: 1580, Train loss: -0.7826, rewards: 0.7518\n",
      "Iteration: 1590, Train loss: -0.8688, rewards: 0.7140\n",
      "Iteration: 1600, Train loss: -0.9409, rewards: 0.7121\n",
      "Eval:\n",
      "Hits@1: 0.7214, Hits@3: 0.7761, Hits@10: 0.7861, MRR: 0.7447\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.8113, rewards: 0.7209\n",
      "Iteration: 1620, Train loss: -0.7334, rewards: 0.7703\n",
      "Iteration: 1630, Train loss: -0.8718, rewards: 0.7124\n",
      "Iteration: 1640, Train loss: -0.8934, rewards: 0.7091\n",
      "Iteration: 1650, Train loss: -0.8173, rewards: 0.7442\n",
      "Iteration: 1660, Train loss: -0.9262, rewards: 0.6991\n",
      "Iteration: 1670, Train loss: -0.8638, rewards: 0.7491\n",
      "Iteration: 1680, Train loss: -0.7907, rewards: 0.7364\n",
      "Iteration: 1690, Train loss: -0.8708, rewards: 0.7229\n",
      "Iteration: 1700, Train loss: -0.8834, rewards: 0.7256\n",
      "Eval:\n",
      "Hits@1: 0.6816, Hits@3: 0.7711, Hits@10: 0.8010, MRR: 0.7219\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -0.7528, rewards: 0.7724\n",
      "Iteration: 1720, Train loss: -0.8419, rewards: 0.7510\n",
      "Iteration: 1730, Train loss: -0.8429, rewards: 0.7536\n",
      "Iteration: 1740, Train loss: -0.9188, rewards: 0.7282\n",
      "Iteration: 1750, Train loss: -0.8347, rewards: 0.7295\n",
      "Iteration: 1760, Train loss: -0.8962, rewards: 0.7364\n",
      "Iteration: 1770, Train loss: -0.8447, rewards: 0.7401\n",
      "Iteration: 1780, Train loss: -0.9472, rewards: 0.7378\n",
      "Iteration: 1790, Train loss: -0.9081, rewards: 0.7424\n",
      "Iteration: 1800, Train loss: -0.8002, rewards: 0.7639\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.7612, Hits@10: 0.8010, MRR: 0.7284\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.8644, rewards: 0.7146\n",
      "Iteration: 1820, Train loss: -0.9711, rewards: 0.7143\n",
      "Iteration: 1830, Train loss: -0.8886, rewards: 0.7333\n",
      "Iteration: 1840, Train loss: -0.8572, rewards: 0.6898\n",
      "Iteration: 1850, Train loss: -0.8941, rewards: 0.7006\n",
      "Iteration: 1860, Train loss: -0.9054, rewards: 0.7354\n",
      "Iteration: 1870, Train loss: -0.9240, rewards: 0.6882\n",
      "Iteration: 1880, Train loss: -0.8472, rewards: 0.7222\n",
      "Iteration: 1890, Train loss: -0.8987, rewards: 0.7038\n",
      "Iteration: 1900, Train loss: -0.9196, rewards: 0.7119\n",
      "Eval:\n",
      "Hits@1: 0.5871, Hits@3: 0.7612, Hits@10: 0.7662, MRR: 0.6565\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -0.8761, rewards: 0.7178\n",
      "Iteration: 1920, Train loss: -0.8350, rewards: 0.7550\n",
      "Iteration: 1930, Train loss: -0.8430, rewards: 0.7301\n",
      "Iteration: 1940, Train loss: -0.8986, rewards: 0.7246\n",
      "Iteration: 1950, Train loss: -0.8150, rewards: 0.7241\n",
      "Iteration: 1960, Train loss: -0.8378, rewards: 0.7429\n",
      "Iteration: 1970, Train loss: -0.8443, rewards: 0.7475\n",
      "Iteration: 1980, Train loss: -0.8817, rewards: 0.7248\n",
      "Iteration: 1990, Train loss: -0.9353, rewards: 0.7012\n",
      "Iteration: 2000, Train loss: -0.8987, rewards: 0.7167\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7811, Hits@10: 0.8060, MRR: 0.7372\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/athletehomestadium//test_beam/ ]\n",
      "Hits@1: 0.7562, Hits@3: 0.7861, Hits@10: 0.8408, MRR: 0.7798\n",
      "AthleteHomeStadium\n",
      "MINERVA MAP: 0.8681338976115095 (201 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 23:59:17,356]\u001b[0m Trial 3 finished with value: 0.8681338976115095 and parameters: {'lr': 0.0020144052994644666, 'bs': 70, 'b': 0.26467995875972145, 'l': 0.050275890973632054, 'ee': 100}. Best is trial 3 with value: 0.8681338976115095.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.6299, rewards: 0.1643\n",
      "Iteration: 20, Train loss: -0.4584, rewards: 0.6753\n",
      "Iteration: 30, Train loss: -0.5392, rewards: 0.6681\n",
      "Iteration: 40, Train loss: -0.4655, rewards: 0.6296\n",
      "Iteration: 50, Train loss: -0.7179, rewards: 0.5635\n",
      "Iteration: 60, Train loss: -0.6997, rewards: 0.5930\n",
      "Iteration: 70, Train loss: -0.6123, rewards: 0.6303\n",
      "Iteration: 80, Train loss: -0.5883, rewards: 0.6411\n",
      "Iteration: 90, Train loss: -0.7958, rewards: 0.6080\n",
      "Iteration: 100, Train loss: -0.9107, rewards: 0.5786\n",
      "Eval:\n",
      "Hits@1: 0.7164, Hits@3: 0.7264, Hits@10: 0.7761, MRR: 0.7302\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.9184, rewards: 0.6048\n",
      "Iteration: 120, Train loss: -0.9120, rewards: 0.6048\n",
      "Iteration: 130, Train loss: -0.8719, rewards: 0.5871\n",
      "Iteration: 140, Train loss: -0.7474, rewards: 0.6820\n",
      "Iteration: 150, Train loss: -0.8496, rewards: 0.5851\n",
      "Iteration: 160, Train loss: -0.8040, rewards: 0.6739\n",
      "Iteration: 170, Train loss: -0.8984, rewards: 0.6659\n",
      "Iteration: 180, Train loss: -0.7320, rewards: 0.6841\n",
      "Iteration: 190, Train loss: -0.8739, rewards: 0.6720\n",
      "Iteration: 200, Train loss: -0.6923, rewards: 0.7024\n",
      "Eval:\n",
      "Hits@1: 0.4776, Hits@3: 0.7662, Hits@10: 0.8109, MRR: 0.5903\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.7154, rewards: 0.6713\n",
      "Iteration: 220, Train loss: -0.7294, rewards: 0.6934\n",
      "Iteration: 230, Train loss: -0.7483, rewards: 0.6916\n",
      "Iteration: 240, Train loss: -0.6844, rewards: 0.7262\n",
      "Iteration: 250, Train loss: -0.6398, rewards: 0.7190\n",
      "Iteration: 260, Train loss: -0.7235, rewards: 0.7122\n",
      "Iteration: 270, Train loss: -0.6356, rewards: 0.7276\n",
      "Iteration: 280, Train loss: -0.7643, rewards: 0.6972\n",
      "Iteration: 290, Train loss: -0.7152, rewards: 0.7197\n",
      "Iteration: 300, Train loss: -0.7171, rewards: 0.7188\n",
      "Eval:\n",
      "Hits@1: 0.5970, Hits@3: 0.8010, Hits@10: 0.8109, MRR: 0.6978\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.7911, rewards: 0.6972\n",
      "Iteration: 320, Train loss: -0.6327, rewards: 0.7295\n",
      "Iteration: 330, Train loss: -0.6800, rewards: 0.7218\n",
      "Iteration: 340, Train loss: -0.6738, rewards: 0.7249\n",
      "Iteration: 350, Train loss: -0.7372, rewards: 0.7044\n",
      "Iteration: 360, Train loss: -0.7885, rewards: 0.6926\n",
      "Iteration: 370, Train loss: -0.8326, rewards: 0.6790\n",
      "Iteration: 380, Train loss: -0.7539, rewards: 0.7095\n",
      "Iteration: 390, Train loss: -0.7664, rewards: 0.7026\n",
      "Iteration: 400, Train loss: -0.7691, rewards: 0.7227\n",
      "Eval:\n",
      "Hits@1: 0.5672, Hits@3: 0.7910, Hits@10: 0.8159, MRR: 0.6777\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.7757, rewards: 0.6948\n",
      "Iteration: 420, Train loss: -0.7222, rewards: 0.7368\n",
      "Iteration: 430, Train loss: -0.7991, rewards: 0.6953\n",
      "Iteration: 440, Train loss: -0.6781, rewards: 0.7035\n",
      "Iteration: 450, Train loss: -0.6085, rewards: 0.7477\n",
      "Iteration: 460, Train loss: -0.5771, rewards: 0.7437\n",
      "Iteration: 470, Train loss: -0.7148, rewards: 0.7167\n",
      "Iteration: 480, Train loss: -0.6545, rewards: 0.7327\n",
      "Iteration: 490, Train loss: -0.6040, rewards: 0.7482\n",
      "Iteration: 500, Train loss: -0.7276, rewards: 0.7040\n",
      "Eval:\n",
      "Hits@1: 0.5423, Hits@3: 0.7960, Hits@10: 0.8109, MRR: 0.6706\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.7253, rewards: 0.7509\n",
      "Iteration: 520, Train loss: -0.6982, rewards: 0.7129\n",
      "Iteration: 530, Train loss: -0.7158, rewards: 0.7424\n",
      "Iteration: 540, Train loss: -0.6195, rewards: 0.7529\n",
      "Iteration: 550, Train loss: -0.6488, rewards: 0.7511\n",
      "Iteration: 560, Train loss: -0.6759, rewards: 0.7295\n",
      "Iteration: 570, Train loss: -0.7204, rewards: 0.6856\n",
      "Iteration: 580, Train loss: -0.7850, rewards: 0.7432\n",
      "Iteration: 590, Train loss: -0.7136, rewards: 0.7051\n",
      "Iteration: 600, Train loss: -0.7199, rewards: 0.7414\n",
      "Eval:\n",
      "Hits@1: 0.5522, Hits@3: 0.8010, Hits@10: 0.8109, MRR: 0.6669\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.7863, rewards: 0.6926\n",
      "Iteration: 620, Train loss: -0.7118, rewards: 0.7339\n",
      "Iteration: 630, Train loss: -0.6863, rewards: 0.7385\n",
      "Iteration: 640, Train loss: -0.5693, rewards: 0.7560\n",
      "Iteration: 650, Train loss: -0.7151, rewards: 0.7100\n",
      "Iteration: 660, Train loss: -0.7075, rewards: 0.7265\n",
      "Iteration: 670, Train loss: -0.7784, rewards: 0.7213\n",
      "Iteration: 680, Train loss: -0.6754, rewards: 0.7573\n",
      "Iteration: 690, Train loss: -0.7645, rewards: 0.7249\n",
      "Iteration: 700, Train loss: -0.7510, rewards: 0.7224\n",
      "Eval:\n",
      "Hits@1: 0.5920, Hits@3: 0.8010, Hits@10: 0.8159, MRR: 0.6915\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.7875, rewards: 0.7102\n",
      "Iteration: 720, Train loss: -0.7943, rewards: 0.7082\n",
      "Iteration: 730, Train loss: -0.5915, rewards: 0.7610\n",
      "Iteration: 740, Train loss: -0.6487, rewards: 0.7244\n",
      "Iteration: 750, Train loss: -0.7140, rewards: 0.7379\n",
      "Iteration: 760, Train loss: -0.6508, rewards: 0.7446\n",
      "Iteration: 770, Train loss: -0.7641, rewards: 0.7077\n",
      "Iteration: 780, Train loss: -0.7848, rewards: 0.7054\n",
      "Iteration: 790, Train loss: -0.7640, rewards: 0.7048\n",
      "Iteration: 800, Train loss: -0.6929, rewards: 0.7076\n",
      "Eval:\n",
      "Hits@1: 0.5821, Hits@3: 0.8010, Hits@10: 0.8159, MRR: 0.6933\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -0.7141, rewards: 0.7267\n",
      "Iteration: 820, Train loss: -0.6171, rewards: 0.7533\n",
      "Iteration: 830, Train loss: -0.7685, rewards: 0.7173\n",
      "Iteration: 840, Train loss: -0.7091, rewards: 0.7596\n",
      "Iteration: 850, Train loss: -0.6120, rewards: 0.7556\n",
      "Iteration: 860, Train loss: -0.6634, rewards: 0.7613\n",
      "Iteration: 870, Train loss: -0.6676, rewards: 0.7443\n",
      "Iteration: 880, Train loss: -0.6933, rewards: 0.7334\n",
      "Iteration: 890, Train loss: -0.6596, rewards: 0.7715\n",
      "Iteration: 900, Train loss: -0.6348, rewards: 0.7418\n",
      "Eval:\n",
      "Hits@1: 0.5871, Hits@3: 0.7960, Hits@10: 0.8109, MRR: 0.6868\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.6470, rewards: 0.7402\n",
      "Iteration: 920, Train loss: -0.7028, rewards: 0.7562\n",
      "Iteration: 930, Train loss: -0.6839, rewards: 0.7689\n",
      "Iteration: 940, Train loss: -0.7120, rewards: 0.7180\n",
      "Iteration: 950, Train loss: -0.6751, rewards: 0.7434\n",
      "Iteration: 960, Train loss: -0.6809, rewards: 0.7399\n",
      "Iteration: 970, Train loss: -0.6496, rewards: 0.7491\n",
      "Iteration: 980, Train loss: -0.7476, rewards: 0.7017\n",
      "Iteration: 990, Train loss: -0.7636, rewards: 0.7294\n",
      "Iteration: 1000, Train loss: -0.6818, rewards: 0.7291\n",
      "Eval:\n",
      "Hits@1: 0.5473, Hits@3: 0.8010, Hits@10: 0.8060, MRR: 0.6614\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.7978, rewards: 0.7220\n",
      "Iteration: 1020, Train loss: -0.6696, rewards: 0.7239\n",
      "Iteration: 1030, Train loss: -0.6859, rewards: 0.7531\n",
      "Iteration: 1040, Train loss: -0.6264, rewards: 0.7855\n",
      "Iteration: 1050, Train loss: -0.6627, rewards: 0.7324\n",
      "Iteration: 1060, Train loss: -0.7160, rewards: 0.7395\n",
      "Iteration: 1070, Train loss: -0.6972, rewards: 0.7393\n",
      "Iteration: 1080, Train loss: -0.6489, rewards: 0.7380\n",
      "Iteration: 1090, Train loss: -0.7443, rewards: 0.7415\n",
      "Iteration: 1100, Train loss: -0.7010, rewards: 0.7511\n",
      "Eval:\n",
      "Hits@1: 0.5174, Hits@3: 0.7662, Hits@10: 0.8159, MRR: 0.6270\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.6313, rewards: 0.7860\n",
      "Iteration: 1120, Train loss: -0.6111, rewards: 0.7712\n",
      "Iteration: 1130, Train loss: -0.7725, rewards: 0.7206\n",
      "Iteration: 1140, Train loss: -0.7620, rewards: 0.7161\n",
      "Iteration: 1150, Train loss: -0.7663, rewards: 0.6981\n",
      "Iteration: 1160, Train loss: -0.6952, rewards: 0.7270\n",
      "Iteration: 1170, Train loss: -0.6989, rewards: 0.7238\n",
      "Iteration: 1180, Train loss: -0.6834, rewards: 0.7661\n",
      "Iteration: 1190, Train loss: -0.5791, rewards: 0.7537\n",
      "Iteration: 1200, Train loss: -0.7657, rewards: 0.6950\n",
      "Eval:\n",
      "Hits@1: 0.6020, Hits@3: 0.8010, Hits@10: 0.8159, MRR: 0.6865\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.7228, rewards: 0.7337\n",
      "Iteration: 1220, Train loss: -0.6444, rewards: 0.7591\n",
      "Iteration: 1230, Train loss: -0.6149, rewards: 0.7803\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.6204, rewards: 0.7704\n",
      "Iteration: 1250, Train loss: -0.7807, rewards: 0.6978\n",
      "Iteration: 1260, Train loss: -0.7367, rewards: 0.7259\n",
      "Iteration: 1270, Train loss: -0.6913, rewards: 0.7151\n",
      "Iteration: 1280, Train loss: -0.6738, rewards: 0.7571\n",
      "Iteration: 1290, Train loss: -0.6914, rewards: 0.7430\n",
      "Iteration: 1300, Train loss: -0.6041, rewards: 0.7968\n",
      "Eval:\n",
      "Hits@1: 0.5622, Hits@3: 0.7960, Hits@10: 0.8060, MRR: 0.6797\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.5939, rewards: 0.7838\n",
      "Iteration: 1320, Train loss: -0.7428, rewards: 0.7056\n",
      "Iteration: 1330, Train loss: -0.7170, rewards: 0.7335\n",
      "Iteration: 1340, Train loss: -0.7802, rewards: 0.7197\n",
      "Iteration: 1350, Train loss: -0.6742, rewards: 0.7518\n",
      "Iteration: 1360, Train loss: -0.6113, rewards: 0.7445\n",
      "Iteration: 1370, Train loss: -0.7095, rewards: 0.7455\n",
      "Iteration: 1380, Train loss: -0.6541, rewards: 0.7507\n",
      "Iteration: 1390, Train loss: -0.5945, rewards: 0.7577\n",
      "Iteration: 1400, Train loss: -0.5972, rewards: 0.7610\n",
      "Eval:\n",
      "Hits@1: 0.5423, Hits@3: 0.7811, Hits@10: 0.8159, MRR: 0.6436\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.6940, rewards: 0.7248\n",
      "Iteration: 1420, Train loss: -0.7718, rewards: 0.7348\n",
      "Iteration: 1430, Train loss: -0.6619, rewards: 0.7321\n",
      "Iteration: 1440, Train loss: -0.7474, rewards: 0.7198\n",
      "Iteration: 1450, Train loss: -0.6919, rewards: 0.7386\n",
      "Iteration: 1460, Train loss: -0.6546, rewards: 0.7481\n",
      "Iteration: 1470, Train loss: -0.6890, rewards: 0.7524\n",
      "Iteration: 1480, Train loss: -0.6533, rewards: 0.7362\n",
      "Iteration: 1490, Train loss: -0.6553, rewards: 0.7695\n",
      "Iteration: 1500, Train loss: -0.6840, rewards: 0.7407\n",
      "Eval:\n",
      "Hits@1: 0.5423, Hits@3: 0.7761, Hits@10: 0.8159, MRR: 0.6404\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.7324, rewards: 0.7438\n",
      "Iteration: 1520, Train loss: -0.6729, rewards: 0.7714\n",
      "Iteration: 1530, Train loss: -0.6851, rewards: 0.7711\n",
      "Iteration: 1540, Train loss: -0.6892, rewards: 0.7676\n",
      "Iteration: 1550, Train loss: -0.7384, rewards: 0.7384\n",
      "Iteration: 1560, Train loss: -0.7281, rewards: 0.7565\n",
      "Iteration: 1570, Train loss: -0.5638, rewards: 0.7586\n",
      "Iteration: 1580, Train loss: -0.6799, rewards: 0.7131\n",
      "Iteration: 1590, Train loss: -0.2477, rewards: 0.7553\n",
      "Iteration: 1600, Train loss: -0.1647, rewards: 0.7184\n",
      "Eval:\n",
      "Hits@1: 0.6965, Hits@3: 0.7612, Hits@10: 0.8010, MRR: 0.7321\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.0180, rewards: 0.6786\n",
      "Iteration: 1620, Train loss: -0.0133, rewards: 0.6979\n",
      "Iteration: 1630, Train loss: -0.0306, rewards: 0.3745\n",
      "Iteration: 1640, Train loss: -0.0482, rewards: 0.1723\n",
      "Iteration: 1650, Train loss: -0.0426, rewards: 0.1277\n",
      "Iteration: 1660, Train loss: -0.0497, rewards: 0.1447\n",
      "Iteration: 1670, Train loss: -0.0468, rewards: 0.0617\n",
      "Iteration: 1680, Train loss: -0.0784, rewards: 0.3979\n",
      "Iteration: 1690, Train loss: -0.0132, rewards: 0.4213\n",
      "Iteration: 1700, Train loss: -0.0262, rewards: 0.5617\n",
      "Eval:\n",
      "Hits@1: 0.6567, Hits@3: 0.7164, Hits@10: 0.7413, MRR: 0.6943\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -0.0244, rewards: 0.6660\n",
      "Iteration: 1720, Train loss: -0.0150, rewards: 0.6979\n",
      "Iteration: 1730, Train loss: -0.0263, rewards: 0.6979\n",
      "Iteration: 1740, Train loss: -0.0231, rewards: 0.6787\n",
      "Iteration: 1750, Train loss: -0.0229, rewards: 0.6383\n",
      "Iteration: 1760, Train loss: -0.0196, rewards: 0.6596\n",
      "Iteration: 1770, Train loss: -0.0267, rewards: 0.6574\n",
      "Iteration: 1780, Train loss: -0.0253, rewards: 0.6596\n",
      "Iteration: 1790, Train loss: -0.0242, rewards: 0.7319\n",
      "Iteration: 1800, Train loss: -0.0197, rewards: 0.6851\n",
      "Eval:\n",
      "Hits@1: 0.7065, Hits@3: 0.7264, Hits@10: 0.7363, MRR: 0.7217\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.0137, rewards: 0.6830\n"
     ]
    }
   ],
   "source": [
    "# Hyperparameter search for the first sub-task. Trials are stored in a\n",
    "# per-task SQLite file named after the sub-task.\n",
    "sub_task = sub_tasks_list[0]\n",
    "study = optuna.create_study(\n",
    "    storage=f\"sqlite:///{sub_task}.db\",\n",
    "    study_name=f\"{sub_task}\",\n",
    "    direction='maximize',\n",
    "    # Reuse the stored study when it already exists; without this, re-running\n",
    "    # the cell against the same .db file raises DuplicatedStudyError.\n",
    "    load_if_exists=True,\n",
    ")\n",
    "study.optimize(objective, n_trials=1000)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
