{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "b2479ab1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-a6f8dd9b-6af8-5e75-8654-84fb2b7b8f6d\"\n",
    "\n",
    "from model.ours3 import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "a39d5a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(task = None):\n",
    "    \"\"\"Build the option dictionary handed to ``Trainer``.\n",
    "\n",
    "    Args:\n",
    "        task: Name of a sub-task data directory under\n",
    "            ``../MINERVA/datasets/data_preprocessed/``. ``None`` selects the\n",
    "            ``nell-995`` data and the top-level ``./outputs_nell995-1/`` directory.\n",
    "\n",
    "    Returns:\n",
    "        dict: paths, the loaded relation/entity vocabularies, agent settings and\n",
    "        hyperparameters. ``pretrain_model_dir`` is only set when ``task`` is given.\n",
    "    \"\"\"\n",
    "    options = {}\n",
    "\n",
    "    #basic setting\n",
    "    task_name = 'nell-995' if task is None else task\n",
    "\n",
    "    options['use_cuda'] = True\n",
    "    options['vocab_dir'] = '../MINERVA/datasets/data_preprocessed/nell/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "    # Read the vocabularies through context managers so the file handles are\n",
    "    # closed immediately instead of being left for the garbage collector.\n",
    "    with open(options['vocab_dir'] + '/relation_vocab.json') as vocab_file:\n",
    "        options['relation_vocab'] = json.load(vocab_file)\n",
    "    with open(options['vocab_dir'] + '/entity_vocab.json') as vocab_file:\n",
    "        options['entity_vocab'] = json.load(vocab_file)\n",
    "\n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_nell995-1/'\n",
    "        options['output_dir'] = './outputs_nell995-1/'\n",
    "    else:\n",
    "        # Sub-task runs start from the checkpoint in the top-level directory and\n",
    "        # write their own results into a per-task sub-directory.\n",
    "        options['pretrain_model_dir'] = './outputs_nell995-1/'\n",
    "        options['model_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        # exist_ok avoids the check-then-create race of os.path.exists + makedirs.\n",
    "        os.makedirs(options['output_dir'], exist_ok=True)\n",
    "        os.makedirs(options['model_dir'], exist_ok=True)\n",
    "\n",
    "    #agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = 1\n",
    "    options['max_num_actions'] = 40\n",
    "    options['gnn_layer'] = 2\n",
    "\n",
    "    #hyperparameters\n",
    "    options['test_rollouts'] = 40\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = 64\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = 0.15\n",
    "    options['Lambda'] = 0.15\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = 0.00005\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 5\n",
    "    # True division: the iteration budget is a float (20.0 with batch_size 64).\n",
    "    options['total_iterations'] = 20*(64/options['batch_size'])\n",
    "    options['pool'] = 'max'\n",
    "\n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "12f1b8ba",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Evaluate the pretrained agent from params['model_dir'] with beam search.\n",
    "params = set_params()\n",
    "# Override the set_params() defaults for this evaluation run.\n",
    "params['test_rollouts'] = 100\n",
    "params['max_num_actions'] = 100\n",
    "params['eval_batch_size'] = 8\n",
    "\n",
    "trainer = Trainer(params)\n",
    "# map_location='cpu' matches the checkpoint loads in objective() and keeps the\n",
    "# restore independent of the device the checkpoint was saved from;\n",
    "# load_state_dict then copies the tensors into the agent's own parameters.\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "# path_logger_file = trainer.path_logger_file\n",
    "output_dir = trainer.output_dir\n",
    "path_logger_file = output_dir\n",
    "\n",
    "# exist_ok makes the cell safe to re-run without a separate existence check.\n",
    "os.makedirs(path_logger_file + \"/\" + \"test_beam\", exist_ok=True)\n",
    "trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "17bc5425",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8207787473535506 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6278593427818233 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.572523027000639 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8249362244897959 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9319237147595357 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.9153204137843777 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.8065181795751745 (193 queries evaluated)\n",
      "WorksFor.txt\n",
      "MINERVA MAP: 0.8287528177373783 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.9408317251690747 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8386739927983896 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "# Sub-task names exactly as they are printed and used as result keys; the\n",
    "# trailing spaces on two entries are stripped only when building file names.\n",
    "sub_tasks_list = [\n",
    "    'AthletePlaysInLeague',\n",
    "    'AthletePlaysForTeam ',\n",
    "    'AthleteHomeStadium ',\n",
    "    'TeamPlaysSport',\n",
    "    'AthletePlaysSport',\n",
    "    'OrganizationHiredPerson',\n",
    "    'PersonBornInLocation',\n",
    "    'WorksFor',\n",
    "    'organizationheadquarteredincity',\n",
    "    'PersonLeadsOrganization',\n",
    "]\n",
    "\n",
    "# Same directory for every sub-task, so it is set once before the loop.\n",
    "trainer.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "# Maps each printed sub-task name to the value returned by nell_eval.\n",
    "map_list = {}\n",
    "for sub_task in sub_tasks_list:\n",
    "    # WorksFor is looked up with a '.txt' suffix, which also ends up in the\n",
    "    # printed name and in the map_list key.\n",
    "    if sub_task.lower() == 'worksfor':\n",
    "        sub_task += '.txt'\n",
    "    print(sub_task)\n",
    "    map_list[sub_task] = nell_eval(\n",
    "        path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\",\n",
    "        trainer.data_input_dir+f'/sort_test_{sub_task.lower().strip()}',\n",
    "    )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "dd2edd24",
   "metadata": {},
   "outputs": [],
   "source": [
    "import optuna\n",
    "from model.ours3 import *\n",
    "# Sub-tasks available for tuning; objective() reads the first active entry.\n",
    "# (A module-level `global` statement is a no-op, so none is needed here.)\n",
    "sub_tasks_list = [\n",
    "# 'AthletePlaysInLeague',\n",
    "# 'AthletePlaysForTeam ',\n",
    "# 'AthleteHomeStadium ',\n",
    "# 'TeamPlaysSport',\n",
    "# 'AthletePlaysSport',\n",
    "# 'OrganizationHiredPerson',\n",
    "# 'PersonBornInLocation',\n",
    "# 'WorksFor',\n",
    "# 'organizationheadquarteredincity',\n",
    "'PersonLeadsOrganization']\n",
    "\n",
    "\n",
    "def objective(trial):\n",
    "    \"\"\"Optuna objective: fine-tune the pretrained agent on one sub-task and score it.\n",
    "\n",
    "    Samples hyperparameters from ``trial``, trains a ``Trainer`` initialised from\n",
    "    the checkpoint in ``pretrain_model_dir``, reloads ``agent.ckpt`` from the\n",
    "    sub-task ``model_dir``, runs beam-search testing and evaluates the written\n",
    "    answers with ``nell_eval``.\n",
    "\n",
    "    Args:\n",
    "        trial: Optuna trial used to sample ``lr``, ``bs``, ``b``, ``l`` and ``ee``.\n",
    "\n",
    "    Returns:\n",
    "        The value returned by ``nell_eval`` for the first entry of ``sub_tasks_list``.\n",
    "    \"\"\"\n",
    "    # Imported locally so the cleanup below does not depend on the star import\n",
    "    # from model.ours3 happening to expose ``gc``.\n",
    "    import gc\n",
    "\n",
    "    sub_task = sub_tasks_list[0]\n",
    "\n",
    "    # NOTE(review): lr spans four orders of magnitude but is sampled uniformly;\n",
    "    # consider log=True (this changes the distribution recorded for the study).\n",
    "    learning_rate = trial.suggest_float('lr', 1e-6, 1e-2)\n",
    "    batch_size = trial.suggest_int('bs', 4, 128)\n",
    "    beta = trial.suggest_float('b', 0, 0.5)\n",
    "    lam = trial.suggest_float('l', 0, 0.5)\n",
    "    eval_every = trial.suggest_categorical('ee', [10,20,50,100])\n",
    "\n",
    "    params = set_params(sub_task.lower().strip())\n",
    "    params['learning_rate'] = learning_rate\n",
    "    params['eval_every'] = eval_every\n",
    "    params['batch_size'] = batch_size\n",
    "    params['beta'] = beta\n",
    "    params['Lambda'] = lam\n",
    "    # 50 evaluation rounds, capped at 2000 iterations.\n",
    "    params['total_iterations'] = min(50*params['eval_every'], 2000)\n",
    "\n",
    "    sub_trainer = Trainer(params)\n",
    "    sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "\n",
    "    sub_trainer.agent.train()\n",
    "    sub_trainer.train()\n",
    "\n",
    "    # Release the training Trainer before the evaluation Trainer is built so the\n",
    "    # two are not resident at the same time.\n",
    "    del sub_trainer\n",
    "    gc.collect()\n",
    "    torch.cuda.empty_cache()\n",
    "\n",
    "    # Evaluation overrides applied on top of the tuned values.\n",
    "    params['test_rollouts'] = 100\n",
    "    params['max_num_actions'] = 100\n",
    "    params['eval_batch_size'] = 8\n",
    "\n",
    "    sub_tester = Trainer(params)\n",
    "    # presumably sub_trainer.train() wrote this checkpoint into model_dir -- TODO confirm\n",
    "    sub_tester.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "    sub_tester.agent.eval()\n",
    "\n",
    "    save_path = sub_tester.save_path\n",
    "    output_dir = sub_tester.output_dir\n",
    "    path_logger_file = output_dir\n",
    "\n",
    "    # exist_ok replaces the separate existence check and is safe across trials.\n",
    "    os.makedirs(path_logger_file + \"/\" + \"test_beam\", exist_ok=True)\n",
    "    sub_tester.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "    with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "        score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "    # NOTE(review): test_test_environment presumably wraps the test split, which\n",
    "    # would mean hyperparameters are selected on test data -- confirm intended.\n",
    "    sub_tester.test_environment = sub_tester.test_test_environment\n",
    "    sub_tester.test(beam=True, print_paths=True, save_model=True)\n",
    "\n",
    "    sub_tester.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "    # WorksFor is looked up with a '.txt' suffix.\n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    MAP = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\",\n",
    "              sub_tester.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')\n",
    "\n",
    "    del sub_tester\n",
    "    gc.collect()\n",
    "    torch.cuda.empty_cache()\n",
    "\n",
    "    return MAP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "74bc15d8",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:11:03,246]\u001b[0m A new study created in RDB with name: PersonLeadsOrganization\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 1, Train loss: -0.5979, rewards: 0.6087\n",
      "Iteration: 2, Train loss: -0.7474, rewards: 0.5802\n",
      "Iteration: 3, Train loss: -0.6236, rewards: 0.4934\n",
      "Iteration: 4, Train loss: -0.7398, rewards: 0.5979\n",
      "Iteration: 5, Train loss: -0.5418, rewards: 0.6215\n",
      "Iteration: 6, Train loss: -0.8979, rewards: 0.5793\n",
      "Iteration: 7, Train loss: -0.8141, rewards: 0.5417\n",
      "Iteration: 8, Train loss: -0.8485, rewards: 0.5682\n",
      "Iteration: 9, Train loss: -0.7572, rewards: 0.6281\n",
      "Iteration: 10, Train loss: -0.7439, rewards: 0.5901\n",
      "Eval:\n",
      "Hits@1: 0.6359, Hits@3: 0.6774, Hits@10: 0.7051, MRR: 0.6611\n",
      "------------------------------------------------------------\n",
      "Iteration: 11, Train loss: -0.8955, rewards: 0.5996\n",
      "Iteration: 12, Train loss: -0.7353, rewards: 0.5698\n",
      "Iteration: 13, Train loss: -0.9421, rewards: 0.5727\n",
      "Iteration: 14, Train loss: -0.8946, rewards: 0.5537\n",
      "Iteration: 15, Train loss: -0.8624, rewards: 0.6025\n",
      "Iteration: 16, Train loss: -0.8150, rewards: 0.6174\n",
      "Iteration: 17, Train loss: -0.8925, rewards: 0.6682\n",
      "Iteration: 18, Train loss: -0.7280, rewards: 0.6591\n",
      "Iteration: 19, Train loss: -0.7970, rewards: 0.6417\n",
      "Iteration: 20, Train loss: -0.8599, rewards: 0.5132\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6866, Hits@10: 0.7143, MRR: 0.6765\n",
      "------------------------------------------------------------\n",
      "Iteration: 21, Train loss: -0.6871, rewards: 0.7157\n",
      "Iteration: 22, Train loss: -0.7554, rewards: 0.5525\n",
      "Iteration: 23, Train loss: -0.9262, rewards: 0.5562\n",
      "Iteration: 24, Train loss: -0.7242, rewards: 0.6298\n",
      "Iteration: 25, Train loss: -0.7154, rewards: 0.5905\n",
      "Iteration: 26, Train loss: -0.9807, rewards: 0.6116\n",
      "Iteration: 27, Train loss: -0.9898, rewards: 0.5855\n",
      "Iteration: 28, Train loss: -0.6986, rewards: 0.6074\n",
      "Iteration: 29, Train loss: -0.9149, rewards: 0.5616\n",
      "Iteration: 30, Train loss: -0.8216, rewards: 0.6570\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7005, MRR: 0.6759\n",
      "------------------------------------------------------------\n",
      "Iteration: 31, Train loss: -0.8586, rewards: 0.5868\n",
      "Iteration: 32, Train loss: -0.8700, rewards: 0.6397\n",
      "Iteration: 33, Train loss: -0.8491, rewards: 0.6347\n",
      "Iteration: 34, Train loss: -0.6469, rewards: 0.6277\n",
      "Iteration: 35, Train loss: -0.8510, rewards: 0.5884\n",
      "Iteration: 36, Train loss: -0.8205, rewards: 0.5839\n",
      "Iteration: 37, Train loss: -0.8039, rewards: 0.6843\n",
      "Iteration: 38, Train loss: -0.8366, rewards: 0.5566\n",
      "Iteration: 39, Train loss: -0.9551, rewards: 0.5802\n",
      "Iteration: 40, Train loss: -0.9180, rewards: 0.6157\n",
      "Eval:\n",
      "Hits@1: 0.6498, Hits@3: 0.6912, Hits@10: 0.6912, MRR: 0.6716\n",
      "------------------------------------------------------------\n",
      "Iteration: 41, Train loss: -0.8301, rewards: 0.7062\n",
      "Iteration: 42, Train loss: -0.5905, rewards: 0.6760\n",
      "Iteration: 43, Train loss: -0.8243, rewards: 0.6140\n",
      "Iteration: 44, Train loss: -0.9333, rewards: 0.7025\n",
      "Iteration: 45, Train loss: -0.9589, rewards: 0.6847\n",
      "Iteration: 46, Train loss: -0.9221, rewards: 0.6950\n",
      "Iteration: 47, Train loss: -0.8182, rewards: 0.6888\n",
      "Iteration: 48, Train loss: -0.7746, rewards: 0.6103\n",
      "Iteration: 49, Train loss: -0.9083, rewards: 0.5921\n",
      "Iteration: 50, Train loss: -0.7937, rewards: 0.6537\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6912, Hits@10: 0.6912, MRR: 0.6894\n",
      "------------------------------------------------------------\n",
      "Iteration: 51, Train loss: -0.8201, rewards: 0.6355\n",
      "Iteration: 52, Train loss: -0.8159, rewards: 0.6579\n",
      "Iteration: 53, Train loss: -0.7728, rewards: 0.6393\n",
      "Iteration: 54, Train loss: -0.8269, rewards: 0.7140\n",
      "Iteration: 55, Train loss: -0.6850, rewards: 0.6967\n",
      "Iteration: 56, Train loss: -0.9360, rewards: 0.7289\n",
      "Iteration: 57, Train loss: -0.7871, rewards: 0.7434\n",
      "Iteration: 58, Train loss: -0.8174, rewards: 0.7318\n",
      "Iteration: 59, Train loss: -0.8880, rewards: 0.6612\n",
      "Iteration: 60, Train loss: -0.9627, rewards: 0.5517\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6843\n",
      "------------------------------------------------------------\n",
      "Iteration: 61, Train loss: -0.8240, rewards: 0.6682\n",
      "Iteration: 62, Train loss: -0.9187, rewards: 0.6475\n",
      "Iteration: 63, Train loss: -0.8603, rewards: 0.7107\n",
      "Iteration: 64, Train loss: -0.9045, rewards: 0.6702\n",
      "Iteration: 65, Train loss: -0.8245, rewards: 0.5938\n",
      "Iteration: 66, Train loss: -0.8674, rewards: 0.6917\n",
      "Iteration: 67, Train loss: -0.9839, rewards: 0.6074\n",
      "Iteration: 68, Train loss: -0.9280, rewards: 0.6264\n",
      "Iteration: 69, Train loss: -0.8032, rewards: 0.6826\n",
      "Iteration: 70, Train loss: -1.0216, rewards: 0.6269\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6959, MRR: 0.6869\n",
      "------------------------------------------------------------\n",
      "Iteration: 71, Train loss: -0.8891, rewards: 0.7124\n",
      "Iteration: 72, Train loss: -0.7118, rewards: 0.7285\n",
      "Iteration: 73, Train loss: -0.7591, rewards: 0.7169\n",
      "Iteration: 74, Train loss: -0.7648, rewards: 0.6632\n",
      "Iteration: 75, Train loss: -0.6984, rewards: 0.7347\n",
      "Iteration: 76, Train loss: -0.9034, rewards: 0.6335\n",
      "Iteration: 77, Train loss: -0.8607, rewards: 0.6719\n",
      "Iteration: 78, Train loss: -0.7192, rewards: 0.6975\n",
      "Iteration: 79, Train loss: -0.7961, rewards: 0.6244\n",
      "Iteration: 80, Train loss: -0.8297, rewards: 0.6839\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.7005, MRR: 0.6870\n",
      "------------------------------------------------------------\n",
      "Iteration: 81, Train loss: -0.8009, rewards: 0.6793\n",
      "Iteration: 82, Train loss: -0.7641, rewards: 0.6645\n",
      "Iteration: 83, Train loss: -0.9607, rewards: 0.6475\n",
      "Iteration: 84, Train loss: -0.9207, rewards: 0.6525\n",
      "Iteration: 85, Train loss: -0.7925, rewards: 0.6421\n",
      "Iteration: 86, Train loss: -0.6667, rewards: 0.7442\n",
      "Iteration: 87, Train loss: -0.8067, rewards: 0.6822\n",
      "Iteration: 88, Train loss: -1.0001, rewards: 0.6814\n",
      "Iteration: 89, Train loss: -0.9255, rewards: 0.6669\n",
      "Iteration: 90, Train loss: -0.7361, rewards: 0.6161\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6866, MRR: 0.6861\n",
      "------------------------------------------------------------\n",
      "Iteration: 91, Train loss: -0.8085, rewards: 0.7120\n",
      "Iteration: 92, Train loss: -0.6828, rewards: 0.6851\n",
      "Iteration: 93, Train loss: -0.7391, rewards: 0.7174\n",
      "Iteration: 94, Train loss: -0.9691, rewards: 0.6789\n",
      "Iteration: 95, Train loss: -0.8921, rewards: 0.6649\n",
      "Iteration: 96, Train loss: -0.8769, rewards: 0.7459\n",
      "Iteration: 97, Train loss: -0.7802, rewards: 0.7269\n",
      "Iteration: 98, Train loss: -0.8221, rewards: 0.6736\n",
      "Iteration: 99, Train loss: -0.8535, rewards: 0.7252\n",
      "Iteration: 100, Train loss: -0.7030, rewards: 0.6661\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6834\n",
      "------------------------------------------------------------\n",
      "Iteration: 101, Train loss: -0.9030, rewards: 0.7029\n",
      "Iteration: 102, Train loss: -0.8318, rewards: 0.6678\n",
      "Iteration: 103, Train loss: -0.9033, rewards: 0.5971\n",
      "Iteration: 104, Train loss: -0.7780, rewards: 0.7450\n",
      "Iteration: 105, Train loss: -0.8298, rewards: 0.6736\n",
      "Iteration: 106, Train loss: -1.0423, rewards: 0.7074\n",
      "Iteration: 107, Train loss: -0.8255, rewards: 0.7219\n",
      "Iteration: 108, Train loss: -0.7978, rewards: 0.7227\n",
      "Iteration: 109, Train loss: -0.7893, rewards: 0.6136\n",
      "Iteration: 110, Train loss: -0.9663, rewards: 0.6421\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6866, MRR: 0.6853\n",
      "------------------------------------------------------------\n",
      "Iteration: 111, Train loss: -0.9993, rewards: 0.6388\n",
      "Iteration: 112, Train loss: -0.8539, rewards: 0.6174\n",
      "Iteration: 113, Train loss: -0.8014, rewards: 0.7306\n",
      "Iteration: 114, Train loss: -0.9026, rewards: 0.6380\n",
      "Iteration: 115, Train loss: -0.8388, rewards: 0.7045\n",
      "Iteration: 116, Train loss: -1.0397, rewards: 0.5843\n",
      "Iteration: 117, Train loss: -0.9292, rewards: 0.6517\n",
      "Iteration: 118, Train loss: -0.9172, rewards: 0.6566\n",
      "Iteration: 119, Train loss: -0.8442, rewards: 0.7017\n",
      "Iteration: 120, Train loss: -1.0579, rewards: 0.6822\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6865\n",
      "------------------------------------------------------------\n",
      "Iteration: 121, Train loss: -0.8834, rewards: 0.6624\n",
      "Iteration: 122, Train loss: -0.9682, rewards: 0.7017\n",
      "Iteration: 123, Train loss: -0.8034, rewards: 0.6293\n",
      "Iteration: 124, Train loss: -0.8847, rewards: 0.6442\n",
      "Iteration: 125, Train loss: -0.8560, rewards: 0.6826\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 126, Train loss: -1.0489, rewards: 0.6740\n",
      "Iteration: 127, Train loss: -0.8564, rewards: 0.6579\n",
      "Iteration: 128, Train loss: -0.9805, rewards: 0.6355\n",
      "Iteration: 129, Train loss: -0.8037, rewards: 0.6963\n",
      "Iteration: 130, Train loss: -0.8182, rewards: 0.6045\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6959, MRR: 0.6871\n",
      "------------------------------------------------------------\n",
      "Iteration: 131, Train loss: -0.8255, rewards: 0.6318\n",
      "Iteration: 132, Train loss: -0.8262, rewards: 0.7017\n",
      "Iteration: 133, Train loss: -0.8640, rewards: 0.6269\n",
      "Iteration: 134, Train loss: -0.8390, rewards: 0.7252\n",
      "Iteration: 135, Train loss: -0.6955, rewards: 0.7554\n",
      "Iteration: 136, Train loss: -0.6316, rewards: 0.7050\n",
      "Iteration: 137, Train loss: -0.8477, rewards: 0.6434\n",
      "Iteration: 138, Train loss: -0.8743, rewards: 0.6983\n",
      "Iteration: 139, Train loss: -0.8594, rewards: 0.6174\n",
      "Iteration: 140, Train loss: -1.0347, rewards: 0.6798\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6866, Hits@10: 0.7005, MRR: 0.6856\n",
      "------------------------------------------------------------\n",
      "Iteration: 141, Train loss: -0.9154, rewards: 0.7112\n",
      "Iteration: 142, Train loss: -0.8278, rewards: 0.6537\n",
      "Iteration: 143, Train loss: -0.8753, rewards: 0.6822\n",
      "Iteration: 144, Train loss: -0.9194, rewards: 0.6983\n",
      "Iteration: 145, Train loss: -0.7709, rewards: 0.6868\n",
      "Iteration: 146, Train loss: -0.9268, rewards: 0.6661\n",
      "Iteration: 147, Train loss: -1.0103, rewards: 0.6335\n",
      "Iteration: 148, Train loss: -0.9396, rewards: 0.6289\n",
      "Iteration: 149, Train loss: -0.8496, rewards: 0.7079\n",
      "Iteration: 150, Train loss: -0.8794, rewards: 0.7062\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.6820, Hits@10: 0.6866, MRR: 0.6800\n",
      "------------------------------------------------------------\n",
      "Iteration: 151, Train loss: -0.7548, rewards: 0.6322\n",
      "Iteration: 152, Train loss: -0.8996, rewards: 0.6793\n",
      "Iteration: 153, Train loss: -1.0333, rewards: 0.6570\n",
      "Iteration: 154, Train loss: -0.7402, rewards: 0.6773\n",
      "Iteration: 155, Train loss: -1.0611, rewards: 0.6831\n",
      "Iteration: 156, Train loss: -0.8197, rewards: 0.6079\n",
      "Iteration: 157, Train loss: -0.9354, rewards: 0.5653\n",
      "Iteration: 158, Train loss: -0.7939, rewards: 0.6008\n",
      "Iteration: 159, Train loss: -1.0426, rewards: 0.6236\n",
      "Iteration: 160, Train loss: -0.8962, rewards: 0.7814\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6959, MRR: 0.6871\n",
      "------------------------------------------------------------\n",
      "Iteration: 161, Train loss: -0.9546, rewards: 0.6583\n",
      "Iteration: 162, Train loss: -0.7286, rewards: 0.6926\n",
      "Iteration: 163, Train loss: -0.7300, rewards: 0.6979\n",
      "Iteration: 164, Train loss: -0.7087, rewards: 0.6393\n",
      "Iteration: 165, Train loss: -0.8439, rewards: 0.6161\n",
      "Iteration: 166, Train loss: -0.9127, rewards: 0.6773\n",
      "Iteration: 167, Train loss: -0.8047, rewards: 0.7054\n",
      "Iteration: 168, Train loss: -0.8898, rewards: 0.6983\n",
      "Iteration: 169, Train loss: -0.9891, rewards: 0.6835\n",
      "Iteration: 170, Train loss: -0.8134, rewards: 0.6434\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6870\n",
      "------------------------------------------------------------\n",
      "Iteration: 171, Train loss: -0.8742, rewards: 0.7372\n",
      "Iteration: 172, Train loss: -0.7193, rewards: 0.6975\n",
      "Iteration: 173, Train loss: -0.9337, rewards: 0.6223\n",
      "Iteration: 174, Train loss: -0.9426, rewards: 0.7112\n",
      "Iteration: 175, Train loss: -0.7076, rewards: 0.6450\n",
      "Iteration: 176, Train loss: -0.9320, rewards: 0.6248\n",
      "Iteration: 177, Train loss: -1.0018, rewards: 0.6467\n",
      "Iteration: 178, Train loss: -0.9178, rewards: 0.6397\n",
      "Iteration: 179, Train loss: -0.8804, rewards: 0.7372\n",
      "Iteration: 180, Train loss: -0.9354, rewards: 0.6686\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6892\n",
      "------------------------------------------------------------\n",
      "Iteration: 181, Train loss: -0.8672, rewards: 0.6492\n",
      "Iteration: 182, Train loss: -0.8630, rewards: 0.7087\n",
      "Iteration: 183, Train loss: -0.8040, rewards: 0.6388\n",
      "Iteration: 184, Train loss: -0.8053, rewards: 0.6967\n",
      "Iteration: 185, Train loss: -1.0249, rewards: 0.6942\n",
      "Iteration: 186, Train loss: -0.6885, rewards: 0.6798\n",
      "Iteration: 187, Train loss: -0.8883, rewards: 0.6401\n",
      "Iteration: 188, Train loss: -0.8590, rewards: 0.6467\n",
      "Iteration: 189, Train loss: -0.8820, rewards: 0.6979\n",
      "Iteration: 190, Train loss: -0.9266, rewards: 0.6186\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6895\n",
      "------------------------------------------------------------\n",
      "Iteration: 191, Train loss: -0.8909, rewards: 0.6079\n",
      "Iteration: 192, Train loss: -0.9238, rewards: 0.6686\n",
      "Iteration: 193, Train loss: -0.8889, rewards: 0.6798\n",
      "Iteration: 194, Train loss: -0.7712, rewards: 0.7211\n",
      "Iteration: 195, Train loss: -0.8991, rewards: 0.6612\n",
      "Iteration: 196, Train loss: -0.9798, rewards: 0.6636\n",
      "Iteration: 197, Train loss: -0.8900, rewards: 0.6186\n",
      "Iteration: 198, Train loss: -0.8906, rewards: 0.6653\n",
      "Iteration: 199, Train loss: -0.9710, rewards: 0.6674\n",
      "Iteration: 200, Train loss: -0.8910, rewards: 0.7376\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6869\n",
      "------------------------------------------------------------\n",
      "Iteration: 201, Train loss: -1.0471, rewards: 0.6302\n",
      "Iteration: 202, Train loss: -0.4574, rewards: 0.7752\n",
      "Iteration: 203, Train loss: -0.7684, rewards: 0.7512\n",
      "Iteration: 204, Train loss: -0.8770, rewards: 0.6467\n",
      "Iteration: 205, Train loss: -0.9166, rewards: 0.6149\n",
      "Iteration: 206, Train loss: -0.7891, rewards: 0.6479\n",
      "Iteration: 207, Train loss: -0.9069, rewards: 0.7248\n",
      "Iteration: 208, Train loss: -0.8884, rewards: 0.6380\n",
      "Iteration: 209, Train loss: -0.9808, rewards: 0.6248\n",
      "Iteration: 210, Train loss: -0.8516, rewards: 0.6698\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6870\n",
      "------------------------------------------------------------\n",
      "Iteration: 211, Train loss: -0.8690, rewards: 0.6789\n",
      "Iteration: 212, Train loss: -0.7733, rewards: 0.6674\n",
      "Iteration: 213, Train loss: -0.7447, rewards: 0.7260\n",
      "Iteration: 214, Train loss: -0.8764, rewards: 0.7165\n",
      "Iteration: 215, Train loss: -0.9480, rewards: 0.6335\n",
      "Iteration: 216, Train loss: -0.7589, rewards: 0.7029\n",
      "Iteration: 217, Train loss: -0.8573, rewards: 0.6587\n",
      "Iteration: 218, Train loss: -0.8591, rewards: 0.6240\n",
      "Iteration: 219, Train loss: -0.8570, rewards: 0.6624\n",
      "Iteration: 220, Train loss: -0.9466, rewards: 0.6636\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6868\n",
      "------------------------------------------------------------\n",
      "Iteration: 221, Train loss: -0.7614, rewards: 0.7244\n",
      "Iteration: 222, Train loss: -0.6837, rewards: 0.7450\n",
      "Iteration: 223, Train loss: -0.8575, rewards: 0.6674\n",
      "Iteration: 224, Train loss: -0.6398, rewards: 0.6781\n",
      "Iteration: 225, Train loss: -0.9461, rewards: 0.7066\n",
      "Iteration: 226, Train loss: -0.7616, rewards: 0.7021\n",
      "Iteration: 227, Train loss: -0.7683, rewards: 0.7012\n",
      "Iteration: 228, Train loss: -0.8140, rewards: 0.6632\n",
      "Iteration: 229, Train loss: -0.8045, rewards: 0.7306\n",
      "Iteration: 230, Train loss: -0.9136, rewards: 0.7463\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6866\n",
      "------------------------------------------------------------\n",
      "Iteration: 231, Train loss: -0.9449, rewards: 0.5657\n",
      "Iteration: 232, Train loss: -0.7125, rewards: 0.7169\n",
      "Iteration: 233, Train loss: -0.8553, rewards: 0.7161\n",
      "Iteration: 234, Train loss: -0.8456, rewards: 0.7186\n",
      "Iteration: 235, Train loss: -0.9722, rewards: 0.6814\n",
      "Iteration: 236, Train loss: -0.6374, rewards: 0.6996\n",
      "Iteration: 237, Train loss: -1.1068, rewards: 0.6686\n",
      "Iteration: 238, Train loss: -0.8626, rewards: 0.6888\n",
      "Iteration: 239, Train loss: -0.8950, rewards: 0.6512\n",
      "Iteration: 240, Train loss: -1.0716, rewards: 0.6521\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6867\n",
      "------------------------------------------------------------\n",
      "Iteration: 241, Train loss: -0.9599, rewards: 0.6459\n",
      "Iteration: 242, Train loss: -0.7244, rewards: 0.7273\n",
      "Iteration: 243, Train loss: -0.9967, rewards: 0.6446\n",
      "Iteration: 244, Train loss: -0.9200, rewards: 0.6368\n",
      "Iteration: 245, Train loss: -0.9784, rewards: 0.6963\n",
      "Iteration: 246, Train loss: -0.7058, rewards: 0.7190\n",
      "Iteration: 247, Train loss: -1.0778, rewards: 0.6612\n",
      "Iteration: 248, Train loss: -0.8770, rewards: 0.6702\n",
      "Iteration: 249, Train loss: -0.9687, rewards: 0.6880\n",
      "Iteration: 250, Train loss: -0.7115, rewards: 0.6851\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6868\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 251, Train loss: -0.7534, rewards: 0.6917\n",
      "Iteration: 252, Train loss: -0.9054, rewards: 0.6963\n",
      "Iteration: 253, Train loss: -0.8814, rewards: 0.7306\n",
      "Iteration: 254, Train loss: -0.8838, rewards: 0.6223\n",
      "Iteration: 255, Train loss: -0.9556, rewards: 0.6190\n",
      "Iteration: 256, Train loss: -0.9171, rewards: 0.6186\n",
      "Iteration: 257, Train loss: -0.8376, rewards: 0.6244\n",
      "Iteration: 258, Train loss: -0.8651, rewards: 0.6930\n",
      "Iteration: 259, Train loss: -0.7971, rewards: 0.6620\n",
      "Iteration: 260, Train loss: -0.8547, rewards: 0.6277\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6820, Hits@10: 0.6912, MRR: 0.6831\n",
      "------------------------------------------------------------\n",
      "Iteration: 261, Train loss: -0.8404, rewards: 0.6649\n",
      "Iteration: 262, Train loss: -0.9669, rewards: 0.6554\n",
      "Iteration: 263, Train loss: -0.8359, rewards: 0.6496\n",
      "Iteration: 264, Train loss: -0.8276, rewards: 0.6731\n",
      "Iteration: 265, Train loss: -0.9836, rewards: 0.6934\n",
      "Iteration: 266, Train loss: -0.8400, rewards: 0.6921\n",
      "Iteration: 267, Train loss: -0.9119, rewards: 0.7099\n",
      "Iteration: 268, Train loss: -0.6787, rewards: 0.6376\n",
      "Iteration: 269, Train loss: -0.8203, rewards: 0.7120\n",
      "Iteration: 270, Train loss: -0.9177, rewards: 0.6988\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6872\n",
      "------------------------------------------------------------\n",
      "Iteration: 271, Train loss: -0.9798, rewards: 0.6616\n",
      "Iteration: 272, Train loss: -0.8039, rewards: 0.7169\n",
      "Iteration: 273, Train loss: -0.9984, rewards: 0.7169\n",
      "Iteration: 274, Train loss: -0.8826, rewards: 0.6566\n",
      "Iteration: 275, Train loss: -0.7980, rewards: 0.6231\n",
      "Iteration: 276, Train loss: -0.8027, rewards: 0.6331\n",
      "Iteration: 277, Train loss: -0.8848, rewards: 0.6360\n",
      "Iteration: 278, Train loss: -0.8682, rewards: 0.6640\n",
      "Iteration: 279, Train loss: -0.8760, rewards: 0.6810\n",
      "Iteration: 280, Train loss: -0.8111, rewards: 0.6855\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6845\n",
      "------------------------------------------------------------\n",
      "Iteration: 281, Train loss: -0.8997, rewards: 0.6616\n",
      "Iteration: 282, Train loss: -0.8112, rewards: 0.6810\n",
      "Iteration: 283, Train loss: -0.8648, rewards: 0.6145\n",
      "Iteration: 284, Train loss: -0.7465, rewards: 0.6942\n",
      "Iteration: 285, Train loss: -1.0284, rewards: 0.6864\n",
      "Iteration: 286, Train loss: -0.8919, rewards: 0.6785\n",
      "Iteration: 287, Train loss: -0.8068, rewards: 0.6744\n",
      "Iteration: 288, Train loss: -0.8742, rewards: 0.6393\n",
      "Iteration: 289, Train loss: -0.7192, rewards: 0.6975\n",
      "Iteration: 290, Train loss: -0.6591, rewards: 0.7153\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6862\n",
      "------------------------------------------------------------\n",
      "Iteration: 291, Train loss: -0.7886, rewards: 0.6921\n",
      "Iteration: 292, Train loss: -0.6417, rewards: 0.7570\n",
      "Iteration: 293, Train loss: -0.7659, rewards: 0.6314\n",
      "Iteration: 294, Train loss: -0.8088, rewards: 0.6868\n",
      "Iteration: 295, Train loss: -0.8870, rewards: 0.6169\n",
      "Iteration: 296, Train loss: -0.8047, rewards: 0.7306\n",
      "Iteration: 297, Train loss: -1.0013, rewards: 0.6839\n",
      "Iteration: 298, Train loss: -0.8474, rewards: 0.5789\n",
      "Iteration: 299, Train loss: -0.7542, rewards: 0.7045\n",
      "Iteration: 300, Train loss: -0.8130, rewards: 0.7269\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6959, MRR: 0.6870\n",
      "------------------------------------------------------------\n",
      "Iteration: 301, Train loss: -0.8266, rewards: 0.7591\n",
      "Iteration: 302, Train loss: -0.7684, rewards: 0.6769\n",
      "Iteration: 303, Train loss: -0.9765, rewards: 0.6723\n",
      "Iteration: 304, Train loss: -0.9125, rewards: 0.7050\n",
      "Iteration: 305, Train loss: -0.8645, rewards: 0.7566\n",
      "Iteration: 306, Train loss: -0.8616, rewards: 0.6872\n",
      "Iteration: 307, Train loss: -0.8774, rewards: 0.6756\n",
      "Iteration: 308, Train loss: -0.8759, rewards: 0.6533\n",
      "Iteration: 309, Train loss: -0.8717, rewards: 0.6620\n",
      "Iteration: 310, Train loss: -0.7428, rewards: 0.7545\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6892\n",
      "------------------------------------------------------------\n",
      "Iteration: 311, Train loss: -0.9357, rewards: 0.6157\n",
      "Iteration: 312, Train loss: -0.8722, rewards: 0.7128\n",
      "Iteration: 313, Train loss: -1.0132, rewards: 0.6570\n",
      "Iteration: 314, Train loss: -0.9514, rewards: 0.6727\n",
      "Iteration: 315, Train loss: -0.8208, rewards: 0.7025\n",
      "Iteration: 316, Train loss: -0.9178, rewards: 0.7281\n",
      "Iteration: 317, Train loss: -1.0191, rewards: 0.6529\n",
      "Iteration: 318, Train loss: -0.8725, rewards: 0.6909\n",
      "Iteration: 319, Train loss: -0.8083, rewards: 0.6897\n",
      "Iteration: 320, Train loss: -0.7939, rewards: 0.6554\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6888\n",
      "------------------------------------------------------------\n",
      "Iteration: 321, Train loss: -0.8256, rewards: 0.6955\n",
      "Iteration: 322, Train loss: -0.6195, rewards: 0.6740\n",
      "Iteration: 323, Train loss: -0.5353, rewards: 0.7802\n",
      "Iteration: 324, Train loss: -0.9266, rewards: 0.6686\n",
      "Iteration: 325, Train loss: -0.9437, rewards: 0.5926\n",
      "Iteration: 326, Train loss: -0.9427, rewards: 0.6835\n",
      "Iteration: 327, Train loss: -0.7279, rewards: 0.7120\n",
      "Iteration: 328, Train loss: -0.9729, rewards: 0.6607\n",
      "Iteration: 329, Train loss: -0.8368, rewards: 0.6814\n",
      "Iteration: 330, Train loss: -1.0689, rewards: 0.5950\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6892\n",
      "------------------------------------------------------------\n",
      "Iteration: 331, Train loss: -0.9287, rewards: 0.6864\n",
      "Iteration: 332, Train loss: -0.8231, rewards: 0.6736\n",
      "Iteration: 333, Train loss: -0.7123, rewards: 0.7017\n",
      "Iteration: 334, Train loss: -0.8054, rewards: 0.7351\n",
      "Iteration: 335, Train loss: -0.8317, rewards: 0.7388\n",
      "Iteration: 336, Train loss: -0.8918, rewards: 0.6227\n",
      "Iteration: 337, Train loss: -0.8328, rewards: 0.7669\n",
      "Iteration: 338, Train loss: -0.7817, rewards: 0.6591\n",
      "Iteration: 339, Train loss: -0.7981, rewards: 0.6748\n",
      "Iteration: 340, Train loss: -0.8257, rewards: 0.7587\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6892\n",
      "------------------------------------------------------------\n",
      "Iteration: 341, Train loss: -0.8042, rewards: 0.6099\n",
      "Iteration: 342, Train loss: -0.9072, rewards: 0.6946\n",
      "Iteration: 343, Train loss: -1.0456, rewards: 0.6314\n",
      "Iteration: 344, Train loss: -0.9248, rewards: 0.5926\n",
      "Iteration: 345, Train loss: -0.6571, rewards: 0.7380\n",
      "Iteration: 346, Train loss: -0.8522, rewards: 0.6760\n",
      "Iteration: 347, Train loss: -0.7250, rewards: 0.7293\n",
      "Iteration: 348, Train loss: -0.9272, rewards: 0.7099\n",
      "Iteration: 349, Train loss: -0.7577, rewards: 0.7380\n",
      "Iteration: 350, Train loss: -0.6644, rewards: 0.6917\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6867\n",
      "------------------------------------------------------------\n",
      "Iteration: 351, Train loss: -0.8093, rewards: 0.6789\n",
      "Iteration: 352, Train loss: -0.8986, rewards: 0.6694\n",
      "Iteration: 353, Train loss: -0.6710, rewards: 0.7132\n",
      "Iteration: 354, Train loss: -0.7484, rewards: 0.6822\n",
      "Iteration: 355, Train loss: -0.9545, rewards: 0.6723\n",
      "Iteration: 356, Train loss: -0.9715, rewards: 0.7273\n",
      "Iteration: 357, Train loss: -0.8252, rewards: 0.6826\n",
      "Iteration: 358, Train loss: -0.9992, rewards: 0.6223\n",
      "Iteration: 359, Train loss: -0.7552, rewards: 0.7194\n",
      "Iteration: 360, Train loss: -0.8207, rewards: 0.6938\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6883\n",
      "------------------------------------------------------------\n",
      "Iteration: 361, Train loss: -0.6751, rewards: 0.6884\n",
      "Iteration: 362, Train loss: -0.9728, rewards: 0.7236\n",
      "Iteration: 363, Train loss: -0.8463, rewards: 0.6938\n",
      "Iteration: 364, Train loss: -0.9300, rewards: 0.6500\n",
      "Iteration: 365, Train loss: -0.8824, rewards: 0.7128\n",
      "Iteration: 366, Train loss: -0.7509, rewards: 0.6731\n",
      "Iteration: 367, Train loss: -0.9276, rewards: 0.6740\n",
      "Iteration: 368, Train loss: -0.9347, rewards: 0.6674\n",
      "Iteration: 369, Train loss: -0.8136, rewards: 0.6707\n",
      "Iteration: 370, Train loss: -0.9939, rewards: 0.5756\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.6912, MRR: 0.6875\n",
      "------------------------------------------------------------\n",
      "Iteration: 371, Train loss: -0.9595, rewards: 0.6802\n",
      "Iteration: 372, Train loss: -0.9614, rewards: 0.6397\n",
      "Iteration: 373, Train loss: -1.0574, rewards: 0.6802\n",
      "Iteration: 374, Train loss: -0.7729, rewards: 0.7360\n",
      "Iteration: 375, Train loss: -0.7749, rewards: 0.6467\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 376, Train loss: -0.9281, rewards: 0.7397\n",
      "Iteration: 377, Train loss: -0.9615, rewards: 0.7029\n",
      "Iteration: 378, Train loss: -0.8319, rewards: 0.5988\n",
      "Iteration: 379, Train loss: -0.7860, rewards: 0.6264\n",
      "Iteration: 380, Train loss: -0.8787, rewards: 0.6570\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6896\n",
      "------------------------------------------------------------\n",
      "Iteration: 381, Train loss: -0.9580, rewards: 0.7029\n",
      "Iteration: 382, Train loss: -0.9177, rewards: 0.7260\n",
      "Iteration: 383, Train loss: -0.7847, rewards: 0.6946\n",
      "Iteration: 384, Train loss: -0.8691, rewards: 0.7285\n",
      "Iteration: 385, Train loss: -1.0550, rewards: 0.6393\n",
      "Iteration: 386, Train loss: -0.7348, rewards: 0.6736\n",
      "Iteration: 387, Train loss: -0.7344, rewards: 0.6731\n",
      "Iteration: 388, Train loss: -0.9171, rewards: 0.6219\n",
      "Iteration: 389, Train loss: -0.9919, rewards: 0.6822\n",
      "Iteration: 390, Train loss: -0.9276, rewards: 0.6174\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.7005, MRR: 0.6896\n",
      "------------------------------------------------------------\n",
      "Iteration: 391, Train loss: -0.7926, rewards: 0.6533\n",
      "Iteration: 392, Train loss: -0.9060, rewards: 0.6583\n",
      "Iteration: 393, Train loss: -0.9560, rewards: 0.6909\n",
      "Iteration: 394, Train loss: -0.7821, rewards: 0.7421\n",
      "Iteration: 395, Train loss: -0.7722, rewards: 0.6674\n",
      "Iteration: 396, Train loss: -0.9323, rewards: 0.6905\n",
      "Iteration: 397, Train loss: -0.9594, rewards: 0.6248\n",
      "Iteration: 398, Train loss: -0.8783, rewards: 0.6355\n",
      "Iteration: 399, Train loss: -0.9313, rewards: 0.6727\n",
      "Iteration: 400, Train loss: -0.9300, rewards: 0.6959\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.6912, Hits@10: 0.7005, MRR: 0.6942\n",
      "------------------------------------------------------------\n",
      "Iteration: 401, Train loss: -0.9918, rewards: 0.6355\n",
      "Iteration: 402, Train loss: -0.8836, rewards: 0.6413\n",
      "Iteration: 403, Train loss: -0.8095, rewards: 0.6500\n",
      "Iteration: 404, Train loss: -0.9709, rewards: 0.6558\n",
      "Iteration: 405, Train loss: -1.0157, rewards: 0.6496\n",
      "Iteration: 406, Train loss: -0.8487, rewards: 0.6835\n",
      "Iteration: 407, Train loss: -0.9103, rewards: 0.7169\n",
      "Iteration: 408, Train loss: -0.9516, rewards: 0.7599\n",
      "Iteration: 409, Train loss: -0.6313, rewards: 0.7198\n",
      "Iteration: 410, Train loss: -0.8189, rewards: 0.6347\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6919\n",
      "------------------------------------------------------------\n",
      "Iteration: 411, Train loss: -0.8048, rewards: 0.7070\n",
      "Iteration: 412, Train loss: -0.8159, rewards: 0.7124\n",
      "Iteration: 413, Train loss: -0.8415, rewards: 0.6711\n",
      "Iteration: 414, Train loss: -1.0994, rewards: 0.6574\n",
      "Iteration: 415, Train loss: -1.0325, rewards: 0.6128\n",
      "Iteration: 416, Train loss: -0.7456, rewards: 0.7298\n",
      "Iteration: 417, Train loss: -0.8090, rewards: 0.6558\n",
      "Iteration: 418, Train loss: -0.7816, rewards: 0.7149\n",
      "Iteration: 419, Train loss: -1.0081, rewards: 0.7000\n",
      "Iteration: 420, Train loss: -0.9740, rewards: 0.7136\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6912, Hits@10: 0.7051, MRR: 0.6918\n",
      "------------------------------------------------------------\n",
      "Iteration: 421, Train loss: -0.8167, rewards: 0.6624\n",
      "Iteration: 422, Train loss: -0.8875, rewards: 0.6847\n",
      "Iteration: 423, Train loss: -0.7518, rewards: 0.6897\n",
      "Iteration: 424, Train loss: -0.8932, rewards: 0.6669\n",
      "Iteration: 425, Train loss: -0.7900, rewards: 0.6215\n",
      "Iteration: 426, Train loss: -0.7303, rewards: 0.6661\n",
      "Iteration: 427, Train loss: -1.1484, rewards: 0.6190\n",
      "Iteration: 428, Train loss: -0.9645, rewards: 0.6669\n",
      "Iteration: 429, Train loss: -0.8303, rewards: 0.7298\n",
      "Iteration: 430, Train loss: -0.8548, rewards: 0.7302\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6918\n",
      "------------------------------------------------------------\n",
      "Iteration: 431, Train loss: -0.7360, rewards: 0.6579\n",
      "Iteration: 432, Train loss: -0.8312, rewards: 0.7145\n",
      "Iteration: 433, Train loss: -1.0751, rewards: 0.6971\n",
      "Iteration: 434, Train loss: -1.0286, rewards: 0.7054\n",
      "Iteration: 435, Train loss: -0.9815, rewards: 0.6318\n",
      "Iteration: 436, Train loss: -0.8859, rewards: 0.6934\n",
      "Iteration: 437, Train loss: -0.9199, rewards: 0.7273\n",
      "Iteration: 438, Train loss: -0.8676, rewards: 0.6988\n",
      "Iteration: 439, Train loss: -0.9314, rewards: 0.6893\n",
      "Iteration: 440, Train loss: -0.8985, rewards: 0.6669\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6894\n",
      "------------------------------------------------------------\n",
      "Iteration: 441, Train loss: -0.5588, rewards: 0.7488\n",
      "Iteration: 442, Train loss: -0.7721, rewards: 0.6467\n",
      "Iteration: 443, Train loss: -0.9310, rewards: 0.8190\n",
      "Iteration: 444, Train loss: -0.8190, rewards: 0.6153\n",
      "Iteration: 445, Train loss: -0.6091, rewards: 0.7640\n",
      "Iteration: 446, Train loss: -0.8084, rewards: 0.7215\n",
      "Iteration: 447, Train loss: -0.7818, rewards: 0.7483\n",
      "Iteration: 448, Train loss: -0.7987, rewards: 0.7054\n",
      "Iteration: 449, Train loss: -0.9090, rewards: 0.6331\n",
      "Iteration: 450, Train loss: -0.9698, rewards: 0.6719\n",
      "Eval:\n",
      "Hits@1: 0.6682, Hits@3: 0.6912, Hits@10: 0.7051, MRR: 0.6829\n",
      "------------------------------------------------------------\n",
      "Iteration: 451, Train loss: -0.7234, rewards: 0.6285\n",
      "Iteration: 452, Train loss: -0.8022, rewards: 0.6955\n",
      "Iteration: 453, Train loss: -0.9214, rewards: 0.6360\n",
      "Iteration: 454, Train loss: -0.6433, rewards: 0.6748\n",
      "Iteration: 455, Train loss: -0.9380, rewards: 0.7376\n",
      "Iteration: 456, Train loss: -0.9586, rewards: 0.5574\n",
      "Iteration: 457, Train loss: -0.8116, rewards: 0.7876\n",
      "Iteration: 458, Train loss: -0.9711, rewards: 0.6802\n",
      "Iteration: 459, Train loss: -0.8371, rewards: 0.7079\n",
      "Iteration: 460, Train loss: -0.8454, rewards: 0.6450\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6895\n",
      "------------------------------------------------------------\n",
      "Iteration: 461, Train loss: -0.7849, rewards: 0.6917\n",
      "Iteration: 462, Train loss: -0.5679, rewards: 0.8124\n",
      "Iteration: 463, Train loss: -0.9376, rewards: 0.6727\n",
      "Iteration: 464, Train loss: -0.9864, rewards: 0.7103\n",
      "Iteration: 465, Train loss: -0.7651, rewards: 0.7070\n",
      "Iteration: 466, Train loss: -0.8284, rewards: 0.6525\n",
      "Iteration: 467, Train loss: -0.8685, rewards: 0.7219\n",
      "Iteration: 468, Train loss: -0.9825, rewards: 0.6835\n",
      "Iteration: 469, Train loss: -0.9020, rewards: 0.6661\n",
      "Iteration: 470, Train loss: -0.7249, rewards: 0.6566\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6895\n",
      "------------------------------------------------------------\n",
      "Iteration: 471, Train loss: -0.8351, rewards: 0.7207\n",
      "Iteration: 472, Train loss: -1.0347, rewards: 0.6442\n",
      "Iteration: 473, Train loss: -0.6960, rewards: 0.7471\n",
      "Iteration: 474, Train loss: -0.8789, rewards: 0.7157\n",
      "Iteration: 475, Train loss: -0.7554, rewards: 0.7045\n",
      "Iteration: 476, Train loss: -0.8270, rewards: 0.7041\n",
      "Iteration: 477, Train loss: -0.6857, rewards: 0.6860\n",
      "Iteration: 478, Train loss: -0.8665, rewards: 0.6802\n",
      "Iteration: 479, Train loss: -0.7676, rewards: 0.6351\n",
      "Iteration: 480, Train loss: -0.7940, rewards: 0.6798\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6874\n",
      "------------------------------------------------------------\n",
      "Iteration: 481, Train loss: -0.7543, rewards: 0.7054\n",
      "Iteration: 482, Train loss: -0.7203, rewards: 0.7318\n",
      "Iteration: 483, Train loss: -0.9061, rewards: 0.6430\n",
      "Iteration: 484, Train loss: -0.9888, rewards: 0.6702\n",
      "Iteration: 485, Train loss: -0.7297, rewards: 0.6731\n",
      "Iteration: 486, Train loss: -0.9075, rewards: 0.6293\n",
      "Iteration: 487, Train loss: -0.7791, rewards: 0.7409\n",
      "Iteration: 488, Train loss: -0.8515, rewards: 0.6888\n",
      "Iteration: 489, Train loss: -0.8208, rewards: 0.6868\n",
      "Iteration: 490, Train loss: -0.7573, rewards: 0.7471\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6892\n",
      "------------------------------------------------------------\n",
      "Iteration: 491, Train loss: -0.6676, rewards: 0.6971\n",
      "Iteration: 492, Train loss: -0.7527, rewards: 0.7355\n",
      "Iteration: 493, Train loss: -0.9336, rewards: 0.7033\n",
      "Iteration: 494, Train loss: -0.9428, rewards: 0.6252\n",
      "Iteration: 495, Train loss: -1.0033, rewards: 0.6372\n",
      "Iteration: 496, Train loss: -0.6618, rewards: 0.7054\n",
      "Iteration: 497, Train loss: -0.7710, rewards: 0.7355\n",
      "Iteration: 498, Train loss: -0.9235, rewards: 0.6562\n",
      "Iteration: 499, Train loss: -0.7473, rewards: 0.6653\n",
      "Iteration: 500, Train loss: -0.8038, rewards: 0.7157\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6914\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 501, Train loss: -0.8710, rewards: 0.6847\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personleadsorganization//test_beam/ ]\n",
      "Hits@1: 0.6336, Hits@3: 0.7500, Hits@10: 0.7802, MRR: 0.6946\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8691002909875059 (179 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:33:13,304]\u001b[0m Trial 0 finished with value: 0.8691002909875059 and parameters: {'lr': 0.00036524588657273476, 'bs': 121, 'b': 0.2087320666461685, 'l': 0.47843261291780187, 'ee': 10}. Best is trial 0 with value: 0.8691002909875059.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.8853, rewards: 0.2835\n",
      "Iteration: 10, Train loss: -0.9946, rewards: 0.2954\n",
      "Iteration: 15, Train loss: -1.1060, rewards: 0.2827\n",
      "Iteration: 20, Train loss: -1.0525, rewards: 0.3231\n",
      "Iteration: 25, Train loss: -1.1203, rewards: 0.4169\n",
      "Iteration: 30, Train loss: -1.0747, rewards: 0.4219\n",
      "Iteration: 35, Train loss: -1.2661, rewards: 0.3938\n",
      "Iteration: 40, Train loss: -1.1480, rewards: 0.3927\n",
      "Iteration: 45, Train loss: -1.0650, rewards: 0.4335\n",
      "Iteration: 50, Train loss: -1.0975, rewards: 0.4785\n",
      "Eval:\n",
      "Hits@1: 0.5991, Hits@3: 0.6544, Hits@10: 0.6959, MRR: 0.6287\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -1.2223, rewards: 0.4235\n",
      "Iteration: 60, Train loss: -1.2034, rewards: 0.5369\n",
      "Iteration: 65, Train loss: -1.1589, rewards: 0.5212\n",
      "Iteration: 70, Train loss: -1.1466, rewards: 0.4808\n",
      "Iteration: 75, Train loss: -0.9740, rewards: 0.5377\n",
      "Iteration: 80, Train loss: -1.1236, rewards: 0.3588\n",
      "Iteration: 85, Train loss: -1.0512, rewards: 0.5423\n",
      "Iteration: 90, Train loss: -1.1876, rewards: 0.4688\n",
      "Iteration: 95, Train loss: -1.1756, rewards: 0.4765\n",
      "Iteration: 100, Train loss: -1.1560, rewards: 0.4550\n",
      "Eval:\n",
      "Hits@1: 0.5853, Hits@3: 0.6636, Hits@10: 0.7051, MRR: 0.6279\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -1.0858, rewards: 0.4669\n",
      "Iteration: 110, Train loss: -1.1700, rewards: 0.5585\n",
      "Iteration: 115, Train loss: -1.1906, rewards: 0.5585\n",
      "Iteration: 120, Train loss: -1.1860, rewards: 0.5500\n",
      "Iteration: 125, Train loss: -1.1043, rewards: 0.4850\n",
      "Iteration: 130, Train loss: -1.1866, rewards: 0.4919\n",
      "Iteration: 135, Train loss: -1.1499, rewards: 0.5819\n",
      "Iteration: 140, Train loss: -1.1682, rewards: 0.5981\n",
      "Iteration: 145, Train loss: -1.2476, rewards: 0.4542\n",
      "Iteration: 150, Train loss: -1.1197, rewards: 0.5746\n",
      "Eval:\n",
      "Hits@1: 0.6313, Hits@3: 0.6774, Hits@10: 0.7143, MRR: 0.6573\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -1.2391, rewards: 0.5292\n",
      "Iteration: 160, Train loss: -1.1204, rewards: 0.5350\n",
      "Iteration: 165, Train loss: -1.0624, rewards: 0.5892\n",
      "Iteration: 170, Train loss: -1.1380, rewards: 0.5327\n",
      "Iteration: 175, Train loss: -1.1981, rewards: 0.4500\n",
      "Iteration: 180, Train loss: -1.1244, rewards: 0.5912\n",
      "Iteration: 185, Train loss: -1.1916, rewards: 0.5885\n",
      "Iteration: 190, Train loss: -1.1933, rewards: 0.5496\n",
      "Iteration: 195, Train loss: -1.2683, rewards: 0.6158\n",
      "Iteration: 200, Train loss: -1.1028, rewards: 0.6373\n",
      "Eval:\n",
      "Hits@1: 0.6129, Hits@3: 0.6728, Hits@10: 0.6959, MRR: 0.6453\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -1.2345, rewards: 0.5088\n",
      "Iteration: 210, Train loss: -1.2466, rewards: 0.5173\n",
      "Iteration: 215, Train loss: -1.2608, rewards: 0.5004\n",
      "Iteration: 220, Train loss: -1.0617, rewards: 0.5562\n",
      "Iteration: 225, Train loss: -1.1835, rewards: 0.5404\n",
      "Iteration: 230, Train loss: -1.1949, rewards: 0.5596\n",
      "Iteration: 235, Train loss: -1.1761, rewards: 0.6015\n",
      "Iteration: 240, Train loss: -1.0525, rewards: 0.5892\n",
      "Iteration: 245, Train loss: -1.3624, rewards: 0.4846\n",
      "Iteration: 250, Train loss: -1.2475, rewards: 0.6135\n",
      "Eval:\n",
      "Hits@1: 0.6452, Hits@3: 0.6820, Hits@10: 0.7189, MRR: 0.6678\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.9868, rewards: 0.6204\n",
      "Iteration: 260, Train loss: -1.3063, rewards: 0.5446\n",
      "Iteration: 265, Train loss: -1.1189, rewards: 0.5869\n",
      "Iteration: 270, Train loss: -1.1477, rewards: 0.6696\n",
      "Iteration: 275, Train loss: -1.2083, rewards: 0.5796\n",
      "Iteration: 280, Train loss: -1.1158, rewards: 0.5250\n",
      "Iteration: 285, Train loss: -1.1856, rewards: 0.5331\n",
      "Iteration: 290, Train loss: -1.1621, rewards: 0.6050\n",
      "Iteration: 295, Train loss: -1.1908, rewards: 0.5746\n",
      "Iteration: 300, Train loss: -1.2385, rewards: 0.5192\n",
      "Eval:\n",
      "Hits@1: 0.6452, Hits@3: 0.6774, Hits@10: 0.7005, MRR: 0.6633\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -1.3078, rewards: 0.5281\n",
      "Iteration: 310, Train loss: -1.2474, rewards: 0.5127\n",
      "Iteration: 315, Train loss: -1.1137, rewards: 0.6015\n",
      "Iteration: 320, Train loss: -1.2522, rewards: 0.5773\n",
      "Iteration: 325, Train loss: -1.1063, rewards: 0.6127\n",
      "Iteration: 330, Train loss: -1.3212, rewards: 0.5477\n",
      "Iteration: 335, Train loss: -1.2883, rewards: 0.5696\n",
      "Iteration: 340, Train loss: -1.1021, rewards: 0.5465\n",
      "Iteration: 345, Train loss: -1.2938, rewards: 0.5400\n",
      "Iteration: 350, Train loss: -1.2931, rewards: 0.5169\n",
      "Eval:\n",
      "Hits@1: 0.6406, Hits@3: 0.6774, Hits@10: 0.7143, MRR: 0.6630\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -1.2316, rewards: 0.5635\n",
      "Iteration: 360, Train loss: -1.1755, rewards: 0.5912\n",
      "Iteration: 365, Train loss: -1.1792, rewards: 0.5092\n",
      "Iteration: 370, Train loss: -1.1854, rewards: 0.5681\n",
      "Iteration: 375, Train loss: -1.2019, rewards: 0.5827\n",
      "Iteration: 380, Train loss: -1.2869, rewards: 0.6242\n",
      "Iteration: 385, Train loss: -1.3200, rewards: 0.5631\n",
      "Iteration: 390, Train loss: -1.1654, rewards: 0.5185\n",
      "Iteration: 395, Train loss: -1.1092, rewards: 0.6019\n",
      "Iteration: 400, Train loss: -1.2398, rewards: 0.6242\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.6820, Hits@10: 0.7143, MRR: 0.6769\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -1.3911, rewards: 0.5665\n",
      "Iteration: 410, Train loss: -1.1517, rewards: 0.6065\n",
      "Iteration: 415, Train loss: -1.3501, rewards: 0.5531\n",
      "Iteration: 420, Train loss: -1.1897, rewards: 0.5996\n",
      "Iteration: 425, Train loss: -1.3477, rewards: 0.4881\n",
      "Iteration: 430, Train loss: -1.2543, rewards: 0.6123\n",
      "Iteration: 435, Train loss: -1.2300, rewards: 0.6365\n",
      "Iteration: 440, Train loss: -1.2643, rewards: 0.5662\n",
      "Iteration: 445, Train loss: -1.1283, rewards: 0.6035\n",
      "Iteration: 450, Train loss: -1.2001, rewards: 0.6204\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.6774, Hits@10: 0.7051, MRR: 0.6746\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -1.1582, rewards: 0.6085\n",
      "Iteration: 460, Train loss: -1.2890, rewards: 0.6215\n",
      "Iteration: 465, Train loss: -1.0493, rewards: 0.6000\n",
      "Iteration: 470, Train loss: -1.1232, rewards: 0.6023\n",
      "Iteration: 475, Train loss: -1.2818, rewards: 0.5665\n",
      "Iteration: 480, Train loss: -1.2540, rewards: 0.6573\n",
      "Iteration: 485, Train loss: -1.1863, rewards: 0.6119\n",
      "Iteration: 490, Train loss: -1.1483, rewards: 0.6469\n",
      "Iteration: 495, Train loss: -1.2873, rewards: 0.6146\n",
      "Iteration: 500, Train loss: -1.1287, rewards: 0.6131\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6728, Hits@10: 0.7097, MRR: 0.6697\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -1.2324, rewards: 0.5104\n",
      "Iteration: 510, Train loss: -1.1791, rewards: 0.6277\n",
      "Iteration: 515, Train loss: -1.3010, rewards: 0.5892\n",
      "Iteration: 520, Train loss: -1.1551, rewards: 0.6396\n",
      "Iteration: 525, Train loss: -1.2721, rewards: 0.5723\n",
      "Iteration: 530, Train loss: -1.2532, rewards: 0.6154\n",
      "Iteration: 535, Train loss: -1.2890, rewards: 0.6777\n",
      "Iteration: 540, Train loss: -1.1115, rewards: 0.6058\n",
      "Iteration: 545, Train loss: -1.2798, rewards: 0.6588\n",
      "Iteration: 550, Train loss: -1.2088, rewards: 0.5985\n",
      "Eval:\n",
      "Hits@1: 0.6359, Hits@3: 0.6728, Hits@10: 0.7097, MRR: 0.6611\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -1.0660, rewards: 0.6600\n",
      "Iteration: 560, Train loss: -1.4452, rewards: 0.5362\n",
      "Iteration: 565, Train loss: -1.1979, rewards: 0.5665\n",
      "Iteration: 570, Train loss: -1.3937, rewards: 0.5681\n",
      "Iteration: 575, Train loss: -1.0947, rewards: 0.6527\n",
      "Iteration: 580, Train loss: -1.2879, rewards: 0.6527\n",
      "Iteration: 585, Train loss: -1.1285, rewards: 0.5373\n",
      "Iteration: 590, Train loss: -1.3201, rewards: 0.5608\n",
      "Iteration: 595, Train loss: -1.1039, rewards: 0.6296\n",
      "Iteration: 600, Train loss: -1.2360, rewards: 0.6373\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6774, Hits@10: 0.7097, MRR: 0.6697\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -1.3075, rewards: 0.5588\n",
      "Iteration: 610, Train loss: -1.3377, rewards: 0.6062\n",
      "Iteration: 615, Train loss: -1.1760, rewards: 0.5981\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -1.1737, rewards: 0.6142\n",
      "Iteration: 625, Train loss: -1.0552, rewards: 0.5781\n",
      "Iteration: 630, Train loss: -1.0957, rewards: 0.6185\n",
      "Iteration: 635, Train loss: -1.0490, rewards: 0.4954\n",
      "Iteration: 640, Train loss: -1.2620, rewards: 0.5123\n",
      "Iteration: 645, Train loss: -1.0580, rewards: 0.6677\n",
      "Iteration: 650, Train loss: -1.3737, rewards: 0.5796\n",
      "Eval:\n",
      "Hits@1: 0.6452, Hits@3: 0.6866, Hits@10: 0.7189, MRR: 0.6699\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -1.1130, rewards: 0.5931\n",
      "Iteration: 660, Train loss: -1.2174, rewards: 0.5931\n",
      "Iteration: 665, Train loss: -1.0073, rewards: 0.7131\n",
      "Iteration: 670, Train loss: -1.1555, rewards: 0.6212\n",
      "Iteration: 675, Train loss: -1.3630, rewards: 0.6469\n",
      "Iteration: 680, Train loss: -1.1548, rewards: 0.5692\n",
      "Iteration: 685, Train loss: -1.2537, rewards: 0.5773\n",
      "Iteration: 690, Train loss: -1.1369, rewards: 0.6308\n",
      "Iteration: 695, Train loss: -1.2058, rewards: 0.6146\n",
      "Iteration: 700, Train loss: -1.2407, rewards: 0.5400\n",
      "Eval:\n",
      "Hits@1: 0.6406, Hits@3: 0.6866, Hits@10: 0.7097, MRR: 0.6663\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -1.1153, rewards: 0.6542\n",
      "Iteration: 710, Train loss: -1.2290, rewards: 0.5612\n",
      "Iteration: 715, Train loss: -1.2691, rewards: 0.6350\n",
      "Iteration: 720, Train loss: -1.1962, rewards: 0.6285\n",
      "Iteration: 725, Train loss: -1.2529, rewards: 0.5992\n",
      "Iteration: 730, Train loss: -1.2131, rewards: 0.6038\n",
      "Iteration: 735, Train loss: -1.3074, rewards: 0.5635\n",
      "Iteration: 740, Train loss: -1.3411, rewards: 0.5865\n",
      "Iteration: 745, Train loss: -1.1045, rewards: 0.6612\n",
      "Iteration: 750, Train loss: -1.1711, rewards: 0.6023\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6912, Hits@10: 0.7051, MRR: 0.6856\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -1.1825, rewards: 0.5469\n",
      "Iteration: 760, Train loss: -1.2061, rewards: 0.5415\n",
      "Iteration: 765, Train loss: -1.3567, rewards: 0.5500\n",
      "Iteration: 770, Train loss: -1.1348, rewards: 0.5900\n",
      "Iteration: 775, Train loss: -1.1868, rewards: 0.6508\n",
      "Iteration: 780, Train loss: -1.2465, rewards: 0.6365\n",
      "Iteration: 785, Train loss: -1.1825, rewards: 0.6281\n",
      "Iteration: 790, Train loss: -1.3460, rewards: 0.6023\n",
      "Iteration: 795, Train loss: -1.2154, rewards: 0.6112\n",
      "Iteration: 800, Train loss: -1.2854, rewards: 0.6635\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6912, Hits@10: 0.7051, MRR: 0.6747\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -1.2232, rewards: 0.5612\n",
      "Iteration: 810, Train loss: -1.1568, rewards: 0.6142\n",
      "Iteration: 815, Train loss: -1.2718, rewards: 0.6665\n",
      "Iteration: 820, Train loss: -1.2015, rewards: 0.6285\n",
      "Iteration: 825, Train loss: -1.1702, rewards: 0.6262\n",
      "Iteration: 830, Train loss: -1.0742, rewards: 0.6700\n",
      "Iteration: 835, Train loss: -1.1620, rewards: 0.6165\n",
      "Iteration: 840, Train loss: -0.9780, rewards: 0.6350\n",
      "Iteration: 845, Train loss: -1.3512, rewards: 0.5958\n",
      "Iteration: 850, Train loss: -1.1768, rewards: 0.6042\n",
      "Eval:\n",
      "Hits@1: 0.6498, Hits@3: 0.6866, Hits@10: 0.7143, MRR: 0.6728\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -1.1386, rewards: 0.6435\n",
      "Iteration: 860, Train loss: -1.2193, rewards: 0.6277\n",
      "Iteration: 865, Train loss: -1.2550, rewards: 0.6773\n",
      "Iteration: 870, Train loss: -1.3174, rewards: 0.6408\n",
      "Iteration: 875, Train loss: -0.9585, rewards: 0.6765\n",
      "Iteration: 880, Train loss: -1.2015, rewards: 0.6612\n",
      "Iteration: 885, Train loss: -1.1304, rewards: 0.5554\n",
      "Iteration: 890, Train loss: -1.3491, rewards: 0.5608\n",
      "Iteration: 895, Train loss: -1.1978, rewards: 0.6573\n",
      "Iteration: 900, Train loss: -1.3012, rewards: 0.6304\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7097, MRR: 0.6761\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -1.2365, rewards: 0.6615\n",
      "Iteration: 910, Train loss: -1.1596, rewards: 0.6473\n",
      "Iteration: 915, Train loss: -1.2482, rewards: 0.5600\n",
      "Iteration: 920, Train loss: -1.1993, rewards: 0.6396\n",
      "Iteration: 925, Train loss: -1.1648, rewards: 0.6246\n",
      "Iteration: 930, Train loss: -1.2188, rewards: 0.5815\n",
      "Iteration: 935, Train loss: -1.2463, rewards: 0.6123\n",
      "Iteration: 940, Train loss: -1.1937, rewards: 0.7081\n",
      "Iteration: 945, Train loss: -1.1898, rewards: 0.5565\n",
      "Iteration: 950, Train loss: -1.1164, rewards: 0.6612\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6866, Hits@10: 0.7051, MRR: 0.6728\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -1.2024, rewards: 0.6127\n",
      "Iteration: 960, Train loss: -1.2702, rewards: 0.5396\n",
      "Iteration: 965, Train loss: -1.0421, rewards: 0.5904\n",
      "Iteration: 970, Train loss: -1.2173, rewards: 0.6446\n",
      "Iteration: 975, Train loss: -1.2320, rewards: 0.6319\n",
      "Iteration: 980, Train loss: -1.2417, rewards: 0.6308\n",
      "Iteration: 985, Train loss: -1.2803, rewards: 0.6085\n",
      "Iteration: 990, Train loss: -1.0227, rewards: 0.6562\n",
      "Iteration: 995, Train loss: -1.2175, rewards: 0.5938\n",
      "Iteration: 1000, Train loss: -1.2999, rewards: 0.5638\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6754\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -1.3999, rewards: 0.5608\n",
      "Iteration: 1010, Train loss: -1.2434, rewards: 0.6646\n",
      "Iteration: 1015, Train loss: -1.1747, rewards: 0.6865\n",
      "Iteration: 1020, Train loss: -1.2305, rewards: 0.6081\n",
      "Iteration: 1025, Train loss: -1.2182, rewards: 0.6085\n",
      "Iteration: 1030, Train loss: -1.2040, rewards: 0.6258\n",
      "Iteration: 1035, Train loss: -1.1006, rewards: 0.6550\n",
      "Iteration: 1040, Train loss: -1.2448, rewards: 0.5277\n",
      "Iteration: 1045, Train loss: -1.3044, rewards: 0.5735\n",
      "Iteration: 1050, Train loss: -1.0383, rewards: 0.7027\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6784\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -1.0773, rewards: 0.6369\n",
      "Iteration: 1060, Train loss: -1.2402, rewards: 0.5619\n",
      "Iteration: 1065, Train loss: -1.2228, rewards: 0.5681\n",
      "Iteration: 1070, Train loss: -1.1019, rewards: 0.5712\n",
      "Iteration: 1075, Train loss: -1.3662, rewards: 0.6150\n",
      "Iteration: 1080, Train loss: -1.1773, rewards: 0.5742\n",
      "Iteration: 1085, Train loss: -1.1400, rewards: 0.6338\n",
      "Iteration: 1090, Train loss: -1.2520, rewards: 0.6388\n",
      "Iteration: 1095, Train loss: -1.2165, rewards: 0.5562\n",
      "Iteration: 1100, Train loss: -1.2573, rewards: 0.6219\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6792\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.9821, rewards: 0.6354\n",
      "Iteration: 1110, Train loss: -1.1545, rewards: 0.7369\n",
      "Iteration: 1115, Train loss: -1.1746, rewards: 0.5973\n",
      "Iteration: 1120, Train loss: -1.2404, rewards: 0.5562\n",
      "Iteration: 1125, Train loss: -1.2924, rewards: 0.5423\n",
      "Iteration: 1130, Train loss: -1.1762, rewards: 0.6796\n",
      "Iteration: 1135, Train loss: -1.1864, rewards: 0.6681\n",
      "Iteration: 1140, Train loss: -1.1955, rewards: 0.6508\n",
      "Iteration: 1145, Train loss: -1.0728, rewards: 0.6477\n",
      "Iteration: 1150, Train loss: -1.1006, rewards: 0.6042\n",
      "Eval:\n",
      "Hits@1: 0.6682, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6835\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -1.1832, rewards: 0.6746\n",
      "Iteration: 1160, Train loss: -1.1957, rewards: 0.6673\n",
      "Iteration: 1165, Train loss: -1.1493, rewards: 0.6912\n",
      "Iteration: 1170, Train loss: -1.0679, rewards: 0.6062\n",
      "Iteration: 1175, Train loss: -1.1723, rewards: 0.6623\n",
      "Iteration: 1180, Train loss: -1.3576, rewards: 0.5719\n",
      "Iteration: 1185, Train loss: -1.3042, rewards: 0.6077\n",
      "Iteration: 1190, Train loss: -1.3130, rewards: 0.5285\n",
      "Iteration: 1195, Train loss: -1.3082, rewards: 0.5873\n",
      "Iteration: 1200, Train loss: -1.3104, rewards: 0.5715\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6959, Hits@10: 0.7005, MRR: 0.6752\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -1.2522, rewards: 0.6435\n",
      "Iteration: 1210, Train loss: -1.1851, rewards: 0.7085\n",
      "Iteration: 1215, Train loss: -1.2342, rewards: 0.6088\n",
      "Iteration: 1220, Train loss: -1.1847, rewards: 0.5504\n",
      "Iteration: 1225, Train loss: -1.0496, rewards: 0.5819\n",
      "Iteration: 1230, Train loss: -1.2064, rewards: 0.6588\n",
      "Iteration: 1235, Train loss: -1.0532, rewards: 0.6858\n",
      "Iteration: 1240, Train loss: -1.2375, rewards: 0.6446\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -1.0758, rewards: 0.6627\n",
      "Iteration: 1250, Train loss: -0.9768, rewards: 0.6604\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.6959, Hits@10: 0.7097, MRR: 0.6823\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -1.3258, rewards: 0.5827\n",
      "Iteration: 1260, Train loss: -1.0478, rewards: 0.6731\n",
      "Iteration: 1265, Train loss: -1.2064, rewards: 0.5977\n",
      "Iteration: 1270, Train loss: -1.1705, rewards: 0.6223\n",
      "Iteration: 1275, Train loss: -1.0365, rewards: 0.7131\n",
      "Iteration: 1280, Train loss: -1.2186, rewards: 0.6219\n",
      "Iteration: 1285, Train loss: -1.0590, rewards: 0.5950\n",
      "Iteration: 1290, Train loss: -1.2367, rewards: 0.6242\n",
      "Iteration: 1295, Train loss: -1.1689, rewards: 0.6212\n",
      "Iteration: 1300, Train loss: -1.0856, rewards: 0.6477\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6829\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -1.1727, rewards: 0.6119\n",
      "Iteration: 1310, Train loss: -1.0871, rewards: 0.6904\n",
      "Iteration: 1315, Train loss: -1.2223, rewards: 0.6446\n",
      "Iteration: 1320, Train loss: -1.1676, rewards: 0.6785\n",
      "Iteration: 1325, Train loss: -1.0740, rewards: 0.6331\n",
      "Iteration: 1330, Train loss: -1.3141, rewards: 0.6019\n",
      "Iteration: 1335, Train loss: -1.2118, rewards: 0.5996\n",
      "Iteration: 1340, Train loss: -1.2584, rewards: 0.6235\n",
      "Iteration: 1345, Train loss: -1.1583, rewards: 0.6077\n",
      "Iteration: 1350, Train loss: -1.1008, rewards: 0.6288\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6795\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -1.1709, rewards: 0.6212\n",
      "Iteration: 1360, Train loss: -1.3885, rewards: 0.6088\n",
      "Iteration: 1365, Train loss: -1.1828, rewards: 0.5696\n",
      "Iteration: 1370, Train loss: -1.2134, rewards: 0.6677\n",
      "Iteration: 1375, Train loss: -1.1077, rewards: 0.5915\n",
      "Iteration: 1380, Train loss: -1.2035, rewards: 0.6642\n",
      "Iteration: 1385, Train loss: -1.1791, rewards: 0.6223\n",
      "Iteration: 1390, Train loss: -1.0986, rewards: 0.6031\n",
      "Iteration: 1395, Train loss: -1.2887, rewards: 0.6450\n",
      "Iteration: 1400, Train loss: -1.2082, rewards: 0.6104\n",
      "Eval:\n",
      "Hits@1: 0.6498, Hits@3: 0.6912, Hits@10: 0.7097, MRR: 0.6734\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -1.1458, rewards: 0.6027\n",
      "Iteration: 1410, Train loss: -1.2535, rewards: 0.5700\n",
      "Iteration: 1415, Train loss: -1.1748, rewards: 0.6996\n",
      "Iteration: 1420, Train loss: -1.1768, rewards: 0.6258\n",
      "Iteration: 1425, Train loss: -1.2248, rewards: 0.6312\n",
      "Iteration: 1430, Train loss: -1.2999, rewards: 0.6135\n",
      "Iteration: 1435, Train loss: -1.2698, rewards: 0.5854\n",
      "Iteration: 1440, Train loss: -1.1624, rewards: 0.6619\n",
      "Iteration: 1445, Train loss: -1.1674, rewards: 0.6750\n",
      "Iteration: 1450, Train loss: -1.2644, rewards: 0.5892\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6777\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -1.1795, rewards: 0.6519\n",
      "Iteration: 1460, Train loss: -1.1330, rewards: 0.6742\n",
      "Iteration: 1465, Train loss: -1.2347, rewards: 0.6969\n",
      "Iteration: 1470, Train loss: -1.1290, rewards: 0.6269\n",
      "Iteration: 1475, Train loss: -1.0600, rewards: 0.6362\n",
      "Iteration: 1480, Train loss: -1.0775, rewards: 0.6915\n",
      "Iteration: 1485, Train loss: -1.0323, rewards: 0.6965\n",
      "Iteration: 1490, Train loss: -1.3032, rewards: 0.6323\n",
      "Iteration: 1495, Train loss: -1.1186, rewards: 0.6731\n",
      "Iteration: 1500, Train loss: -1.0161, rewards: 0.6662\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6959, Hits@10: 0.7189, MRR: 0.6899\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -1.0932, rewards: 0.6200\n",
      "Iteration: 1510, Train loss: -1.2183, rewards: 0.5627\n",
      "Iteration: 1515, Train loss: -1.2926, rewards: 0.5715\n",
      "Iteration: 1520, Train loss: -1.1686, rewards: 0.6496\n",
      "Iteration: 1525, Train loss: -1.2232, rewards: 0.6081\n",
      "Iteration: 1530, Train loss: -1.1167, rewards: 0.6515\n",
      "Iteration: 1535, Train loss: -1.1598, rewards: 0.6408\n",
      "Iteration: 1540, Train loss: -1.1123, rewards: 0.5919\n",
      "Iteration: 1545, Train loss: -1.2598, rewards: 0.6565\n",
      "Iteration: 1550, Train loss: -1.0572, rewards: 0.7050\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6783\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -1.2205, rewards: 0.6427\n",
      "Iteration: 1560, Train loss: -1.1488, rewards: 0.6862\n",
      "Iteration: 1565, Train loss: -1.1750, rewards: 0.6719\n",
      "Iteration: 1570, Train loss: -1.2863, rewards: 0.5727\n",
      "Iteration: 1575, Train loss: -1.2280, rewards: 0.5946\n",
      "Iteration: 1580, Train loss: -1.0420, rewards: 0.6427\n",
      "Iteration: 1585, Train loss: -1.2949, rewards: 0.6346\n",
      "Iteration: 1590, Train loss: -1.1746, rewards: 0.6608\n",
      "Iteration: 1595, Train loss: -1.3735, rewards: 0.5796\n",
      "Iteration: 1600, Train loss: -1.1956, rewards: 0.5473\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6859\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -1.1248, rewards: 0.6258\n",
      "Iteration: 1610, Train loss: -1.2032, rewards: 0.6785\n",
      "Iteration: 1615, Train loss: -1.1798, rewards: 0.6762\n",
      "Iteration: 1620, Train loss: -1.1852, rewards: 0.6296\n",
      "Iteration: 1625, Train loss: -1.2575, rewards: 0.6081\n",
      "Iteration: 1630, Train loss: -1.1138, rewards: 0.6223\n",
      "Iteration: 1635, Train loss: -1.1178, rewards: 0.6042\n",
      "Iteration: 1640, Train loss: -1.2455, rewards: 0.6577\n",
      "Iteration: 1645, Train loss: -1.3580, rewards: 0.6012\n",
      "Iteration: 1650, Train loss: -1.2275, rewards: 0.6592\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.6959, Hits@10: 0.7143, MRR: 0.6866\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -1.1179, rewards: 0.5881\n",
      "Iteration: 1660, Train loss: -1.2246, rewards: 0.6046\n",
      "Iteration: 1665, Train loss: -1.1600, rewards: 0.6119\n",
      "Iteration: 1670, Train loss: -1.2142, rewards: 0.6281\n",
      "Iteration: 1675, Train loss: -1.3386, rewards: 0.5938\n",
      "Iteration: 1680, Train loss: -1.1941, rewards: 0.6081\n",
      "Iteration: 1685, Train loss: -1.2996, rewards: 0.6581\n",
      "Iteration: 1690, Train loss: -1.0069, rewards: 0.6088\n",
      "Iteration: 1695, Train loss: -1.1449, rewards: 0.6627\n",
      "Iteration: 1700, Train loss: -1.1494, rewards: 0.6042\n",
      "Eval:\n",
      "Hits@1: 0.6406, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6673\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -1.3214, rewards: 0.5873\n",
      "Iteration: 1710, Train loss: -1.2336, rewards: 0.6027\n",
      "Iteration: 1715, Train loss: -1.2445, rewards: 0.6665\n",
      "Iteration: 1720, Train loss: -1.2467, rewards: 0.6812\n",
      "Iteration: 1725, Train loss: -1.0876, rewards: 0.6542\n",
      "Iteration: 1730, Train loss: -1.1236, rewards: 0.6462\n",
      "Iteration: 1735, Train loss: -1.0655, rewards: 0.6750\n",
      "Iteration: 1740, Train loss: -1.1282, rewards: 0.6773\n",
      "Iteration: 1745, Train loss: -1.1615, rewards: 0.5673\n",
      "Iteration: 1750, Train loss: -1.2216, rewards: 0.6650\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7189, MRR: 0.6795\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -1.3954, rewards: 0.6227\n",
      "Iteration: 1760, Train loss: -1.2580, rewards: 0.5862\n",
      "Iteration: 1765, Train loss: -1.1396, rewards: 0.6692\n",
      "Iteration: 1770, Train loss: -1.1277, rewards: 0.6500\n",
      "Iteration: 1775, Train loss: -1.2365, rewards: 0.6742\n",
      "Iteration: 1780, Train loss: -1.1085, rewards: 0.6469\n",
      "Iteration: 1785, Train loss: -1.1606, rewards: 0.6842\n",
      "Iteration: 1790, Train loss: -1.3101, rewards: 0.6192\n",
      "Iteration: 1795, Train loss: -1.3130, rewards: 0.6346\n",
      "Iteration: 1800, Train loss: -1.2570, rewards: 0.6654\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6800\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -1.2678, rewards: 0.6277\n",
      "Iteration: 1810, Train loss: -1.0329, rewards: 0.7069\n",
      "Iteration: 1815, Train loss: -1.0174, rewards: 0.6696\n",
      "Iteration: 1820, Train loss: -0.9986, rewards: 0.6862\n",
      "Iteration: 1825, Train loss: -1.2423, rewards: 0.6373\n",
      "Iteration: 1830, Train loss: -1.2349, rewards: 0.6323\n",
      "Iteration: 1835, Train loss: -1.2268, rewards: 0.6396\n",
      "Iteration: 1840, Train loss: -1.3422, rewards: 0.5658\n",
      "Iteration: 1845, Train loss: -1.2137, rewards: 0.6242\n",
      "Iteration: 1850, Train loss: -1.1705, rewards: 0.6262\n",
      "Eval:\n",
      "Hits@1: 0.6498, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6730\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -1.1672, rewards: 0.6519\n",
      "Iteration: 1860, Train loss: -1.2276, rewards: 0.5827\n",
      "Iteration: 1865, Train loss: -1.2539, rewards: 0.5788\n",
      "Iteration: 1870, Train loss: -1.1474, rewards: 0.6331\n",
      "Iteration: 1875, Train loss: -1.1459, rewards: 0.6681\n",
      "Iteration: 1880, Train loss: -0.9964, rewards: 0.6473\n",
      "Iteration: 1885, Train loss: -1.0461, rewards: 0.6338\n",
      "Iteration: 1890, Train loss: -1.2880, rewards: 0.6004\n",
      "Iteration: 1895, Train loss: -1.2803, rewards: 0.5842\n",
      "Iteration: 1900, Train loss: -1.1195, rewards: 0.6431\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6912, Hits@10: 0.7097, MRR: 0.6773\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -1.0402, rewards: 0.6915\n",
      "Iteration: 1910, Train loss: -1.0529, rewards: 0.7012\n",
      "Iteration: 1915, Train loss: -1.1653, rewards: 0.6835\n",
      "Iteration: 1920, Train loss: -1.1139, rewards: 0.6831\n",
      "Iteration: 1925, Train loss: -1.1476, rewards: 0.7054\n",
      "Iteration: 1930, Train loss: -1.2058, rewards: 0.6404\n",
      "Iteration: 1935, Train loss: -1.2898, rewards: 0.5304\n",
      "Iteration: 1940, Train loss: -1.1775, rewards: 0.5738\n",
      "Iteration: 1945, Train loss: -1.2683, rewards: 0.6400\n",
      "Iteration: 1950, Train loss: -1.2046, rewards: 0.6412\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.6912, Hits@10: 0.7097, MRR: 0.6801\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -1.0406, rewards: 0.5985\n",
      "Iteration: 1960, Train loss: -1.1839, rewards: 0.6138\n",
      "Iteration: 1965, Train loss: -1.0173, rewards: 0.6415\n",
      "Iteration: 1970, Train loss: -1.0915, rewards: 0.6585\n",
      "Iteration: 1975, Train loss: -1.1671, rewards: 0.6281\n",
      "Iteration: 1980, Train loss: -1.1352, rewards: 0.6765\n",
      "Iteration: 1985, Train loss: -1.0754, rewards: 0.6838\n",
      "Iteration: 1990, Train loss: -1.1169, rewards: 0.6415\n",
      "Iteration: 1995, Train loss: -1.1111, rewards: 0.7050\n",
      "Iteration: 2000, Train loss: -1.2204, rewards: 0.6827\n",
      "Eval:\n",
      "Hits@1: 0.6498, Hits@3: 0.6959, Hits@10: 0.7189, MRR: 0.6772\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personleadsorganization//test_beam/ ]\n",
      "Hits@1: 0.5086, Hits@3: 0.6552, Hits@10: 0.7629, MRR: 0.5953\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8394605190469031 (179 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 22:07:32,450]\u001b[0m Trial 1 finished with value: 0.8394605190469031 and parameters: {'lr': 0.0044254826028598685, 'bs': 26, 'b': 0.4062481708120685, 'l': 0.24826128393010238, 'ee': 50}. Best is trial 0 with value: 0.8691002909875059.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.6869, rewards: 0.3959\n",
      "Iteration: 10, Train loss: -0.8282, rewards: 0.4933\n",
      "Iteration: 15, Train loss: -0.8756, rewards: 0.5424\n",
      "Iteration: 20, Train loss: -0.8906, rewards: 0.5207\n",
      "Iteration: 25, Train loss: -0.8235, rewards: 0.5718\n",
      "Iteration: 30, Train loss: -0.7873, rewards: 0.5439\n",
      "Iteration: 35, Train loss: -0.8250, rewards: 0.5678\n",
      "Iteration: 40, Train loss: -0.8293, rewards: 0.4973\n",
      "Iteration: 45, Train loss: -0.8329, rewards: 0.5810\n",
      "Iteration: 50, Train loss: -0.8911, rewards: 0.5976\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.6805\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.7372, rewards: 0.5978\n",
      "Iteration: 60, Train loss: -0.7890, rewards: 0.6091\n",
      "Iteration: 65, Train loss: -0.8565, rewards: 0.5641\n",
      "Iteration: 70, Train loss: -0.8563, rewards: 0.5885\n",
      "Iteration: 75, Train loss: -0.7693, rewards: 0.6753\n",
      "Iteration: 80, Train loss: -0.8645, rewards: 0.6128\n",
      "Iteration: 85, Train loss: -0.8689, rewards: 0.5882\n",
      "Iteration: 90, Train loss: -0.8477, rewards: 0.6332\n",
      "Iteration: 95, Train loss: -0.8212, rewards: 0.6228\n",
      "Iteration: 100, Train loss: -0.8827, rewards: 0.6546\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.6831\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.8703, rewards: 0.6492\n",
      "Iteration: 110, Train loss: -0.8854, rewards: 0.6667\n",
      "Iteration: 115, Train loss: -0.9492, rewards: 0.6157\n",
      "Iteration: 120, Train loss: -0.9705, rewards: 0.6317\n",
      "Iteration: 125, Train loss: -0.9123, rewards: 0.6307\n",
      "Iteration: 130, Train loss: -0.9516, rewards: 0.6071\n",
      "Iteration: 135, Train loss: -0.9514, rewards: 0.6278\n",
      "Iteration: 140, Train loss: -0.8542, rewards: 0.6522\n",
      "Iteration: 145, Train loss: -0.8350, rewards: 0.6388\n",
      "Iteration: 150, Train loss: -0.8553, rewards: 0.6561\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.6993\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.8963, rewards: 0.6772\n",
      "Iteration: 160, Train loss: -0.8728, rewards: 0.6394\n",
      "Iteration: 165, Train loss: -0.8246, rewards: 0.6774\n",
      "Iteration: 170, Train loss: -0.8832, rewards: 0.6587\n",
      "Iteration: 175, Train loss: -0.9460, rewards: 0.6618\n",
      "Iteration: 180, Train loss: -0.8690, rewards: 0.6709\n",
      "Iteration: 185, Train loss: -0.8748, rewards: 0.6927\n",
      "Iteration: 190, Train loss: -0.8938, rewards: 0.6730\n",
      "Iteration: 195, Train loss: -0.9969, rewards: 0.6546\n",
      "Iteration: 200, Train loss: -0.8155, rewards: 0.6883\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7012\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.9004, rewards: 0.6839\n",
      "Iteration: 210, Train loss: -0.8952, rewards: 0.6307\n",
      "Iteration: 215, Train loss: -0.8897, rewards: 0.6337\n",
      "Iteration: 220, Train loss: -0.8895, rewards: 0.7078\n",
      "Iteration: 225, Train loss: -0.9286, rewards: 0.6584\n",
      "Iteration: 230, Train loss: -0.8646, rewards: 0.6861\n",
      "Iteration: 235, Train loss: -0.8577, rewards: 0.6332\n",
      "Iteration: 240, Train loss: -0.9312, rewards: 0.6802\n",
      "Iteration: 245, Train loss: -0.9090, rewards: 0.6447\n",
      "Iteration: 250, Train loss: -0.9226, rewards: 0.6566\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7039\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.8251, rewards: 0.6637\n",
      "Iteration: 260, Train loss: -0.8717, rewards: 0.7041\n",
      "Iteration: 265, Train loss: -0.8628, rewards: 0.6929\n",
      "Iteration: 270, Train loss: -0.9326, rewards: 0.6853\n",
      "Iteration: 275, Train loss: -0.8851, rewards: 0.6747\n",
      "Iteration: 280, Train loss: -0.8980, rewards: 0.7100\n",
      "Iteration: 285, Train loss: -0.9510, rewards: 0.6771\n",
      "Iteration: 290, Train loss: -0.9582, rewards: 0.7095\n",
      "Iteration: 295, Train loss: -0.9169, rewards: 0.6897\n",
      "Iteration: 300, Train loss: -0.9787, rewards: 0.6622\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7011\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.9356, rewards: 0.6815\n",
      "Iteration: 310, Train loss: -0.8487, rewards: 0.7202\n",
      "Iteration: 315, Train loss: -0.9478, rewards: 0.6615\n",
      "Iteration: 320, Train loss: -0.8756, rewards: 0.7147\n",
      "Iteration: 325, Train loss: -0.9435, rewards: 0.6752\n",
      "Iteration: 330, Train loss: -0.8876, rewards: 0.6661\n",
      "Iteration: 335, Train loss: -0.8172, rewards: 0.6738\n",
      "Iteration: 340, Train loss: -0.8797, rewards: 0.6787\n",
      "Iteration: 345, Train loss: -0.9463, rewards: 0.6786\n",
      "Iteration: 350, Train loss: -0.8373, rewards: 0.6736\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7032\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -0.8915, rewards: 0.6695\n",
      "Iteration: 360, Train loss: -0.9679, rewards: 0.6614\n",
      "Iteration: 365, Train loss: -0.7845, rewards: 0.6941\n",
      "Iteration: 370, Train loss: -1.0195, rewards: 0.6459\n",
      "Iteration: 375, Train loss: -0.8491, rewards: 0.6527\n",
      "Iteration: 380, Train loss: -0.9090, rewards: 0.6682\n",
      "Iteration: 385, Train loss: -0.9006, rewards: 0.6609\n",
      "Iteration: 390, Train loss: -0.9229, rewards: 0.6617\n",
      "Iteration: 395, Train loss: -0.8839, rewards: 0.6937\n",
      "Iteration: 400, Train loss: -0.9286, rewards: 0.6934\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6866, Hits@10: 0.7097, MRR: 0.6884\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -0.8327, rewards: 0.7034\n",
      "Iteration: 410, Train loss: -0.8792, rewards: 0.7000\n",
      "Iteration: 415, Train loss: -0.9647, rewards: 0.6770\n",
      "Iteration: 420, Train loss: -0.9682, rewards: 0.6637\n",
      "Iteration: 425, Train loss: -0.9243, rewards: 0.6367\n",
      "Iteration: 430, Train loss: -0.9031, rewards: 0.6852\n",
      "Iteration: 435, Train loss: -0.8978, rewards: 0.6878\n",
      "Iteration: 440, Train loss: -0.9496, rewards: 0.6864\n",
      "Iteration: 445, Train loss: -0.9056, rewards: 0.6638\n",
      "Iteration: 450, Train loss: -0.8652, rewards: 0.6623\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7051, Hits@10: 0.7143, MRR: 0.6954\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -0.9334, rewards: 0.6580\n",
      "Iteration: 460, Train loss: -0.9454, rewards: 0.6638\n",
      "Iteration: 465, Train loss: -0.8590, rewards: 0.7189\n",
      "Iteration: 470, Train loss: -0.9852, rewards: 0.6860\n",
      "Iteration: 475, Train loss: -0.8637, rewards: 0.6844\n",
      "Iteration: 480, Train loss: -0.8547, rewards: 0.6829\n",
      "Iteration: 485, Train loss: -0.8607, rewards: 0.7209\n",
      "Iteration: 490, Train loss: -0.9844, rewards: 0.6687\n",
      "Iteration: 495, Train loss: -0.9400, rewards: 0.6939\n",
      "Iteration: 500, Train loss: -0.9038, rewards: 0.6622\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7060\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -0.9245, rewards: 0.6934\n",
      "Iteration: 510, Train loss: -0.8776, rewards: 0.7017\n",
      "Iteration: 515, Train loss: -0.9417, rewards: 0.6685\n",
      "Iteration: 520, Train loss: -0.9847, rewards: 0.6824\n",
      "Iteration: 525, Train loss: -0.8968, rewards: 0.6998\n",
      "Iteration: 530, Train loss: -0.8789, rewards: 0.7051\n",
      "Iteration: 535, Train loss: -0.8280, rewards: 0.6871\n",
      "Iteration: 540, Train loss: -0.9410, rewards: 0.6983\n",
      "Iteration: 545, Train loss: -0.9122, rewards: 0.7009\n",
      "Iteration: 550, Train loss: -0.9457, rewards: 0.7170\n",
      "Eval:\n",
      "Hits@1: 0.6636, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.6842\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -1.0003, rewards: 0.6972\n",
      "Iteration: 560, Train loss: -0.9637, rewards: 0.7054\n",
      "Iteration: 565, Train loss: -1.0206, rewards: 0.6902\n",
      "Iteration: 570, Train loss: -0.8726, rewards: 0.6823\n",
      "Iteration: 575, Train loss: -0.9150, rewards: 0.7033\n",
      "Iteration: 580, Train loss: -0.8509, rewards: 0.6803\n",
      "Iteration: 585, Train loss: -0.8293, rewards: 0.7105\n",
      "Iteration: 590, Train loss: -0.9266, rewards: 0.6780\n",
      "Iteration: 595, Train loss: -0.9226, rewards: 0.6991\n",
      "Iteration: 600, Train loss: -0.8848, rewards: 0.7064\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7031\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -0.8295, rewards: 0.7276\n",
      "Iteration: 610, Train loss: -0.7779, rewards: 0.6972\n",
      "Iteration: 615, Train loss: -0.9595, rewards: 0.6920\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -0.8961, rewards: 0.6852\n",
      "Iteration: 625, Train loss: -0.8991, rewards: 0.6816\n",
      "Iteration: 630, Train loss: -1.0394, rewards: 0.7128\n",
      "Iteration: 635, Train loss: -0.9510, rewards: 0.6935\n",
      "Iteration: 640, Train loss: -0.9652, rewards: 0.6816\n",
      "Iteration: 645, Train loss: -0.9847, rewards: 0.6864\n",
      "Iteration: 650, Train loss: -0.9375, rewards: 0.6531\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.6912, Hits@10: 0.7143, MRR: 0.6866\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -0.9205, rewards: 0.6988\n",
      "Iteration: 660, Train loss: -0.9982, rewards: 0.6775\n",
      "Iteration: 665, Train loss: -0.9979, rewards: 0.6691\n",
      "Iteration: 670, Train loss: -0.8298, rewards: 0.7386\n",
      "Iteration: 675, Train loss: -0.9566, rewards: 0.6797\n",
      "Iteration: 680, Train loss: -0.9344, rewards: 0.6898\n",
      "Iteration: 685, Train loss: -0.9663, rewards: 0.6859\n",
      "Iteration: 690, Train loss: -0.9013, rewards: 0.6953\n",
      "Iteration: 695, Train loss: -1.0245, rewards: 0.6885\n",
      "Iteration: 700, Train loss: -0.9753, rewards: 0.6684\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7051, Hits@10: 0.7143, MRR: 0.6956\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -1.0045, rewards: 0.6712\n",
      "Iteration: 710, Train loss: -0.8448, rewards: 0.6810\n",
      "Iteration: 715, Train loss: -0.8473, rewards: 0.6749\n",
      "Iteration: 720, Train loss: -0.8955, rewards: 0.7072\n",
      "Iteration: 725, Train loss: -0.8797, rewards: 0.7079\n",
      "Iteration: 730, Train loss: -0.9208, rewards: 0.7109\n",
      "Iteration: 735, Train loss: -1.0241, rewards: 0.6879\n",
      "Iteration: 740, Train loss: -0.9423, rewards: 0.6982\n",
      "Iteration: 745, Train loss: -0.9375, rewards: 0.6888\n",
      "Iteration: 750, Train loss: -0.9873, rewards: 0.6737\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.7051, Hits@10: 0.7143, MRR: 0.6925\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.9560, rewards: 0.6683\n",
      "Iteration: 760, Train loss: -0.9331, rewards: 0.6881\n",
      "Iteration: 765, Train loss: -0.8093, rewards: 0.7084\n",
      "Iteration: 770, Train loss: -0.9393, rewards: 0.6931\n",
      "Iteration: 775, Train loss: -0.9449, rewards: 0.6709\n",
      "Iteration: 780, Train loss: -0.9707, rewards: 0.6797\n",
      "Iteration: 785, Train loss: -0.7408, rewards: 0.7293\n",
      "Iteration: 790, Train loss: -0.9318, rewards: 0.6831\n",
      "Iteration: 795, Train loss: -0.8783, rewards: 0.6597\n",
      "Iteration: 800, Train loss: -1.0426, rewards: 0.6673\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7027\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -0.9086, rewards: 0.6789\n",
      "Iteration: 810, Train loss: -0.8321, rewards: 0.6994\n",
      "Iteration: 815, Train loss: -0.9375, rewards: 0.6822\n",
      "Iteration: 820, Train loss: -0.9444, rewards: 0.6772\n",
      "Iteration: 825, Train loss: -0.9276, rewards: 0.6713\n",
      "Iteration: 830, Train loss: -0.8291, rewards: 0.7203\n",
      "Iteration: 835, Train loss: -0.8853, rewards: 0.6658\n",
      "Iteration: 840, Train loss: -0.8770, rewards: 0.6578\n",
      "Iteration: 845, Train loss: -0.8952, rewards: 0.6990\n",
      "Iteration: 850, Train loss: -0.9125, rewards: 0.6826\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7031\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -0.8885, rewards: 0.6869\n",
      "Iteration: 860, Train loss: -0.8628, rewards: 0.6789\n",
      "Iteration: 865, Train loss: -0.9142, rewards: 0.6623\n",
      "Iteration: 870, Train loss: -0.8920, rewards: 0.7091\n",
      "Iteration: 875, Train loss: -0.9549, rewards: 0.7045\n",
      "Iteration: 880, Train loss: -0.9334, rewards: 0.6811\n",
      "Iteration: 885, Train loss: -0.9468, rewards: 0.6917\n",
      "Iteration: 890, Train loss: -0.8467, rewards: 0.7189\n",
      "Iteration: 895, Train loss: -0.9590, rewards: 0.6770\n",
      "Iteration: 900, Train loss: -0.9028, rewards: 0.6725\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7035\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -0.8611, rewards: 0.6768\n",
      "Iteration: 910, Train loss: -0.8847, rewards: 0.6932\n",
      "Iteration: 915, Train loss: -0.9784, rewards: 0.6616\n",
      "Iteration: 920, Train loss: -0.8530, rewards: 0.6842\n",
      "Iteration: 925, Train loss: -0.8635, rewards: 0.6766\n",
      "Iteration: 930, Train loss: -0.9121, rewards: 0.6873\n",
      "Iteration: 935, Train loss: -0.9292, rewards: 0.6819\n",
      "Iteration: 940, Train loss: -0.8649, rewards: 0.6747\n",
      "Iteration: 945, Train loss: -0.8885, rewards: 0.6926\n",
      "Iteration: 950, Train loss: -0.9298, rewards: 0.6858\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6962\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -0.9111, rewards: 0.6957\n",
      "Iteration: 960, Train loss: -0.8642, rewards: 0.6891\n",
      "Iteration: 965, Train loss: -0.7951, rewards: 0.7014\n",
      "Iteration: 970, Train loss: -0.8708, rewards: 0.6378\n",
      "Iteration: 975, Train loss: -0.8948, rewards: 0.6660\n",
      "Iteration: 980, Train loss: -0.8844, rewards: 0.7099\n",
      "Iteration: 985, Train loss: -0.9292, rewards: 0.7067\n",
      "Iteration: 990, Train loss: -0.9669, rewards: 0.6880\n",
      "Iteration: 995, Train loss: -0.8890, rewards: 0.6586\n",
      "Iteration: 1000, Train loss: -0.9551, rewards: 0.6962\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7006\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -0.8566, rewards: 0.7166\n",
      "Iteration: 1010, Train loss: -0.8394, rewards: 0.7340\n",
      "Iteration: 1015, Train loss: -0.8319, rewards: 0.7056\n",
      "Iteration: 1020, Train loss: -0.8331, rewards: 0.7002\n",
      "Iteration: 1025, Train loss: -0.8646, rewards: 0.6952\n",
      "Iteration: 1030, Train loss: -0.9442, rewards: 0.6592\n",
      "Iteration: 1035, Train loss: -0.9029, rewards: 0.6840\n",
      "Iteration: 1040, Train loss: -0.9434, rewards: 0.6730\n",
      "Iteration: 1045, Train loss: -0.9114, rewards: 0.6886\n",
      "Iteration: 1050, Train loss: -0.8855, rewards: 0.7124\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7062\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -0.9324, rewards: 0.7077\n",
      "Iteration: 1060, Train loss: -0.9434, rewards: 0.6802\n",
      "Iteration: 1065, Train loss: -0.9491, rewards: 0.7091\n",
      "Iteration: 1070, Train loss: -0.8481, rewards: 0.6957\n",
      "Iteration: 1075, Train loss: -0.9043, rewards: 0.7023\n",
      "Iteration: 1080, Train loss: -0.8458, rewards: 0.7011\n",
      "Iteration: 1085, Train loss: -0.9219, rewards: 0.7086\n",
      "Iteration: 1090, Train loss: -0.8836, rewards: 0.6749\n",
      "Iteration: 1095, Train loss: -0.9561, rewards: 0.6589\n",
      "Iteration: 1100, Train loss: -0.9745, rewards: 0.6867\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7035\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.9425, rewards: 0.6663\n",
      "Iteration: 1110, Train loss: -0.9036, rewards: 0.7336\n",
      "Iteration: 1115, Train loss: -0.9129, rewards: 0.6983\n",
      "Iteration: 1120, Train loss: -0.8628, rewards: 0.6732\n",
      "Iteration: 1125, Train loss: -0.9151, rewards: 0.6734\n",
      "Iteration: 1130, Train loss: -0.9190, rewards: 0.6814\n",
      "Iteration: 1135, Train loss: -0.8685, rewards: 0.6880\n",
      "Iteration: 1140, Train loss: -0.9545, rewards: 0.7052\n",
      "Iteration: 1145, Train loss: -0.8774, rewards: 0.6974\n",
      "Iteration: 1150, Train loss: -0.8285, rewards: 0.7288\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6939\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -1.0373, rewards: 0.6689\n",
      "Iteration: 1160, Train loss: -1.0171, rewards: 0.6605\n",
      "Iteration: 1165, Train loss: -0.9203, rewards: 0.7366\n",
      "Iteration: 1170, Train loss: -0.9964, rewards: 0.6598\n",
      "Iteration: 1175, Train loss: -0.9163, rewards: 0.7184\n",
      "Iteration: 1180, Train loss: -0.9282, rewards: 0.7107\n",
      "Iteration: 1185, Train loss: -0.9012, rewards: 0.6895\n",
      "Iteration: 1190, Train loss: -0.8919, rewards: 0.6693\n",
      "Iteration: 1195, Train loss: -0.9442, rewards: 0.7008\n",
      "Iteration: 1200, Train loss: -0.9174, rewards: 0.7004\n",
      "Eval:\n",
      "Hits@1: 0.7051, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7075\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -0.9540, rewards: 0.6839\n",
      "Iteration: 1210, Train loss: -0.9289, rewards: 0.7058\n",
      "Iteration: 1215, Train loss: -0.8770, rewards: 0.6853\n",
      "Iteration: 1220, Train loss: -0.9267, rewards: 0.7015\n",
      "Iteration: 1225, Train loss: -0.8574, rewards: 0.6847\n",
      "Iteration: 1230, Train loss: -0.9510, rewards: 0.7059\n",
      "Iteration: 1235, Train loss: -0.9266, rewards: 0.7179\n",
      "Iteration: 1240, Train loss: -0.8204, rewards: 0.7088\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -0.7510, rewards: 0.7094\n",
      "Iteration: 1250, Train loss: -0.8343, rewards: 0.6672\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6970\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -0.9570, rewards: 0.6630\n",
      "Iteration: 1260, Train loss: -0.9581, rewards: 0.6703\n",
      "Iteration: 1265, Train loss: -0.7964, rewards: 0.7110\n",
      "Iteration: 1270, Train loss: -0.9180, rewards: 0.6947\n",
      "Iteration: 1275, Train loss: -0.8968, rewards: 0.6809\n",
      "Iteration: 1280, Train loss: -0.8985, rewards: 0.6840\n",
      "Iteration: 1285, Train loss: -0.9629, rewards: 0.6609\n",
      "Iteration: 1290, Train loss: -0.9210, rewards: 0.7036\n",
      "Iteration: 1295, Train loss: -0.9329, rewards: 0.7236\n",
      "Iteration: 1300, Train loss: -0.8171, rewards: 0.7103\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7012\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -0.8772, rewards: 0.7028\n",
      "Iteration: 1310, Train loss: -0.8966, rewards: 0.7134\n",
      "Iteration: 1315, Train loss: -0.8435, rewards: 0.7159\n",
      "Iteration: 1320, Train loss: -0.8715, rewards: 0.6919\n",
      "Iteration: 1325, Train loss: -0.9284, rewards: 0.7001\n",
      "Iteration: 1330, Train loss: -0.9393, rewards: 0.7232\n",
      "Iteration: 1335, Train loss: -0.9005, rewards: 0.7007\n",
      "Iteration: 1340, Train loss: -0.8739, rewards: 0.7261\n",
      "Iteration: 1345, Train loss: -0.8358, rewards: 0.7078\n",
      "Iteration: 1350, Train loss: -0.8870, rewards: 0.6868\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6985\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -0.9518, rewards: 0.6826\n",
      "Iteration: 1360, Train loss: -0.9346, rewards: 0.6693\n",
      "Iteration: 1365, Train loss: -0.8802, rewards: 0.7080\n",
      "Iteration: 1370, Train loss: -0.8995, rewards: 0.7181\n",
      "Iteration: 1375, Train loss: -0.8084, rewards: 0.7084\n",
      "Iteration: 1380, Train loss: -0.9087, rewards: 0.6915\n",
      "Iteration: 1385, Train loss: -0.9718, rewards: 0.6809\n",
      "Iteration: 1390, Train loss: -0.9231, rewards: 0.6935\n",
      "Iteration: 1395, Train loss: -0.9575, rewards: 0.6675\n",
      "Iteration: 1400, Train loss: -0.9341, rewards: 0.6950\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6864\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -0.9119, rewards: 0.6975\n",
      "Iteration: 1410, Train loss: -0.9441, rewards: 0.6744\n",
      "Iteration: 1415, Train loss: -0.8591, rewards: 0.6928\n",
      "Iteration: 1420, Train loss: -1.0156, rewards: 0.6815\n",
      "Iteration: 1425, Train loss: -0.8995, rewards: 0.7008\n",
      "Iteration: 1430, Train loss: -0.8423, rewards: 0.7264\n",
      "Iteration: 1435, Train loss: -0.9230, rewards: 0.6992\n",
      "Iteration: 1440, Train loss: -0.9605, rewards: 0.7047\n",
      "Iteration: 1445, Train loss: -0.8919, rewards: 0.6813\n",
      "Iteration: 1450, Train loss: -0.8689, rewards: 0.7166\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6939\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -0.8550, rewards: 0.6728\n",
      "Iteration: 1460, Train loss: -0.7928, rewards: 0.6770\n",
      "Iteration: 1465, Train loss: -0.8728, rewards: 0.7132\n",
      "Iteration: 1470, Train loss: -0.9190, rewards: 0.6616\n",
      "Iteration: 1475, Train loss: -0.8242, rewards: 0.6642\n",
      "Iteration: 1480, Train loss: -0.9067, rewards: 0.6991\n",
      "Iteration: 1485, Train loss: -0.9281, rewards: 0.6777\n",
      "Iteration: 1490, Train loss: -0.8761, rewards: 0.7018\n",
      "Iteration: 1495, Train loss: -0.9695, rewards: 0.6834\n",
      "Iteration: 1500, Train loss: -0.9298, rewards: 0.6906\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6960\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -0.8944, rewards: 0.6769\n",
      "Iteration: 1510, Train loss: -0.8339, rewards: 0.7084\n",
      "Iteration: 1515, Train loss: -0.9212, rewards: 0.6925\n",
      "Iteration: 1520, Train loss: -0.9086, rewards: 0.6986\n",
      "Iteration: 1525, Train loss: -0.7672, rewards: 0.7263\n",
      "Iteration: 1530, Train loss: -0.8947, rewards: 0.7117\n",
      "Iteration: 1535, Train loss: -0.8218, rewards: 0.7255\n",
      "Iteration: 1540, Train loss: -0.9345, rewards: 0.6844\n",
      "Iteration: 1545, Train loss: -0.8277, rewards: 0.7015\n",
      "Iteration: 1550, Train loss: -0.8650, rewards: 0.7118\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7002\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.9462, rewards: 0.6822\n",
      "Iteration: 1560, Train loss: -0.8164, rewards: 0.7308\n",
      "Iteration: 1565, Train loss: -0.9053, rewards: 0.6890\n",
      "Iteration: 1570, Train loss: -0.9117, rewards: 0.7096\n",
      "Iteration: 1575, Train loss: -0.9240, rewards: 0.6852\n",
      "Iteration: 1580, Train loss: -0.8855, rewards: 0.6768\n",
      "Iteration: 1585, Train loss: -0.8716, rewards: 0.7230\n",
      "Iteration: 1590, Train loss: -0.7594, rewards: 0.7367\n",
      "Iteration: 1595, Train loss: -0.8419, rewards: 0.7181\n",
      "Iteration: 1600, Train loss: -0.8815, rewards: 0.6678\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7060\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.9477, rewards: 0.6774\n",
      "Iteration: 1610, Train loss: -0.9622, rewards: 0.7020\n",
      "Iteration: 1615, Train loss: -0.8766, rewards: 0.7042\n",
      "Iteration: 1620, Train loss: -0.8974, rewards: 0.6919\n",
      "Iteration: 1625, Train loss: -0.9154, rewards: 0.6863\n",
      "Iteration: 1630, Train loss: -0.8909, rewards: 0.7155\n",
      "Iteration: 1635, Train loss: -0.8548, rewards: 0.6687\n",
      "Iteration: 1640, Train loss: -0.8677, rewards: 0.6957\n",
      "Iteration: 1645, Train loss: -0.8576, rewards: 0.7280\n",
      "Iteration: 1650, Train loss: -0.9773, rewards: 0.6854\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6932\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -0.9334, rewards: 0.6952\n",
      "Iteration: 1660, Train loss: -0.9599, rewards: 0.6709\n",
      "Iteration: 1665, Train loss: -0.9031, rewards: 0.6698\n",
      "Iteration: 1670, Train loss: -0.9081, rewards: 0.6814\n",
      "Iteration: 1675, Train loss: -0.9718, rewards: 0.7102\n",
      "Iteration: 1680, Train loss: -0.8693, rewards: 0.7059\n",
      "Iteration: 1685, Train loss: -0.9103, rewards: 0.7009\n",
      "Iteration: 1690, Train loss: -0.9072, rewards: 0.6947\n",
      "Iteration: 1695, Train loss: -0.9576, rewards: 0.7219\n",
      "Iteration: 1700, Train loss: -0.9078, rewards: 0.6751\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6922\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -0.8368, rewards: 0.7022\n",
      "Iteration: 1710, Train loss: -0.8749, rewards: 0.6971\n",
      "Iteration: 1715, Train loss: -0.9223, rewards: 0.6874\n",
      "Iteration: 1720, Train loss: -0.8842, rewards: 0.6956\n",
      "Iteration: 1725, Train loss: -0.9383, rewards: 0.6894\n",
      "Iteration: 1730, Train loss: -0.9558, rewards: 0.6793\n",
      "Iteration: 1735, Train loss: -0.9609, rewards: 0.6972\n",
      "Iteration: 1740, Train loss: -0.9651, rewards: 0.6591\n",
      "Iteration: 1745, Train loss: -0.9384, rewards: 0.7191\n",
      "Iteration: 1750, Train loss: -0.9920, rewards: 0.6942\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7014\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.8103, rewards: 0.7156\n",
      "Iteration: 1760, Train loss: -0.9654, rewards: 0.6787\n",
      "Iteration: 1765, Train loss: -0.9204, rewards: 0.6931\n",
      "Iteration: 1770, Train loss: -0.8240, rewards: 0.7336\n",
      "Iteration: 1775, Train loss: -0.9051, rewards: 0.7164\n",
      "Iteration: 1780, Train loss: -0.8154, rewards: 0.6803\n",
      "Iteration: 1785, Train loss: -0.9168, rewards: 0.7005\n",
      "Iteration: 1790, Train loss: -0.9181, rewards: 0.7017\n",
      "Iteration: 1795, Train loss: -0.8937, rewards: 0.6941\n",
      "Iteration: 1800, Train loss: -0.9338, rewards: 0.6712\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6960\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -0.8956, rewards: 0.7193\n",
      "Iteration: 1810, Train loss: -0.8962, rewards: 0.7326\n",
      "Iteration: 1815, Train loss: -0.9679, rewards: 0.6872\n",
      "Iteration: 1820, Train loss: -0.9278, rewards: 0.7056\n",
      "Iteration: 1825, Train loss: -0.9593, rewards: 0.6913\n",
      "Iteration: 1830, Train loss: -0.9538, rewards: 0.7004\n",
      "Iteration: 1835, Train loss: -0.8736, rewards: 0.6956\n",
      "Iteration: 1840, Train loss: -0.9410, rewards: 0.7036\n",
      "Iteration: 1845, Train loss: -0.8909, rewards: 0.6857\n",
      "Iteration: 1850, Train loss: -0.8491, rewards: 0.7007\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6914\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -0.8627, rewards: 0.6983\n",
      "Iteration: 1860, Train loss: -0.9186, rewards: 0.7182\n",
      "Iteration: 1865, Train loss: -0.9103, rewards: 0.6787\n",
      "Iteration: 1870, Train loss: -0.9138, rewards: 0.6762\n",
      "Iteration: 1875, Train loss: -0.9191, rewards: 0.7112\n",
      "Iteration: 1880, Train loss: -0.8976, rewards: 0.6978\n",
      "Iteration: 1885, Train loss: -0.9345, rewards: 0.6599\n",
      "Iteration: 1890, Train loss: -0.8737, rewards: 0.6680\n",
      "Iteration: 1895, Train loss: -0.9123, rewards: 0.7100\n",
      "Iteration: 1900, Train loss: -0.8776, rewards: 0.6837\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7055\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -0.9631, rewards: 0.6708\n",
      "Iteration: 1910, Train loss: -0.9492, rewards: 0.6786\n",
      "Iteration: 1915, Train loss: -0.9584, rewards: 0.6773\n",
      "Iteration: 1920, Train loss: -0.9503, rewards: 0.6829\n",
      "Iteration: 1925, Train loss: -0.8927, rewards: 0.6652\n",
      "Iteration: 1930, Train loss: -0.9188, rewards: 0.7059\n",
      "Iteration: 1935, Train loss: -0.8638, rewards: 0.6872\n",
      "Iteration: 1940, Train loss: -0.9146, rewards: 0.6618\n",
      "Iteration: 1945, Train loss: -0.9106, rewards: 0.6914\n",
      "Iteration: 1950, Train loss: -0.8694, rewards: 0.7034\n",
      "Eval:\n",
      "Hits@1: 0.6774, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6939\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -0.9089, rewards: 0.6765\n",
      "Iteration: 1960, Train loss: -0.8986, rewards: 0.6978\n",
      "Iteration: 1965, Train loss: -0.8907, rewards: 0.6943\n",
      "Iteration: 1970, Train loss: -0.8996, rewards: 0.7062\n",
      "Iteration: 1975, Train loss: -0.8909, rewards: 0.7091\n",
      "Iteration: 1980, Train loss: -0.9466, rewards: 0.6682\n",
      "Iteration: 1985, Train loss: -1.0023, rewards: 0.6820\n",
      "Iteration: 1990, Train loss: -0.9419, rewards: 0.6962\n",
      "Iteration: 1995, Train loss: -1.0247, rewards: 0.6819\n",
      "Iteration: 2000, Train loss: -0.9219, rewards: 0.6847\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6914\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personleadsorganization//test_beam/ ]\n",
      "Hits@1: 0.5259, Hits@3: 0.6810, Hits@10: 0.7629, MRR: 0.6144\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8506260289278488 (179 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 23:10:11,094]\u001b[0m Trial 2 finished with value: 0.8506260289278488 and parameters: {'lr': 0.002902551631944494, 'bs': 116, 'b': 0.2668309782078609, 'l': 0.0589140042498707, 'ee': 50}. Best is trial 0 with value: 0.8691002909875059.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.2856, rewards: 0.5395\n",
      "Iteration: 20, Train loss: -0.2231, rewards: 0.5683\n",
      "Iteration: 30, Train loss: -0.2591, rewards: 0.5822\n",
      "Iteration: 40, Train loss: -0.2242, rewards: 0.5871\n",
      "Iteration: 50, Train loss: -0.2806, rewards: 0.5680\n",
      "Iteration: 60, Train loss: -0.2360, rewards: 0.6206\n",
      "Iteration: 70, Train loss: -0.2430, rewards: 0.6247\n",
      "Iteration: 80, Train loss: -0.2293, rewards: 0.5838\n",
      "Iteration: 90, Train loss: -0.2275, rewards: 0.6150\n",
      "Iteration: 100, Train loss: -0.2647, rewards: 0.6223\n",
      "Eval:\n",
      "Hits@1: 0.6083, Hits@3: 0.6406, Hits@10: 0.6774, MRR: 0.6295\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.2544, rewards: 0.6371\n",
      "Iteration: 120, Train loss: -0.2458, rewards: 0.6404\n",
      "Iteration: 130, Train loss: -0.2168, rewards: 0.6485\n",
      "Iteration: 140, Train loss: -0.2330, rewards: 0.6293\n",
      "Iteration: 150, Train loss: -0.2948, rewards: 0.6463\n",
      "Iteration: 160, Train loss: -0.2459, rewards: 0.6163\n",
      "Iteration: 170, Train loss: -0.2238, rewards: 0.6113\n",
      "Iteration: 180, Train loss: -0.2584, rewards: 0.6150\n",
      "Iteration: 190, Train loss: -0.2629, rewards: 0.6042\n",
      "Iteration: 200, Train loss: -0.2497, rewards: 0.6020\n",
      "Eval:\n",
      "Hits@1: 0.5899, Hits@3: 0.6590, Hits@10: 0.6866, MRR: 0.6293\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.2449, rewards: 0.5561\n",
      "Iteration: 220, Train loss: -0.2673, rewards: 0.5956\n",
      "Iteration: 230, Train loss: -0.2178, rewards: 0.5821\n",
      "Iteration: 240, Train loss: -0.1872, rewards: 0.4880\n",
      "Iteration: 250, Train loss: -0.1857, rewards: 0.5944\n",
      "Iteration: 260, Train loss: -0.1704, rewards: 0.5536\n",
      "Iteration: 270, Train loss: -0.1136, rewards: 0.5944\n",
      "Iteration: 280, Train loss: -0.1220, rewards: 0.5874\n",
      "Iteration: 290, Train loss: -0.0676, rewards: 0.6073\n",
      "Iteration: 300, Train loss: -0.1216, rewards: 0.5665\n",
      "Eval:\n",
      "Hits@1: 0.5530, Hits@3: 0.6313, Hits@10: 0.6590, MRR: 0.5954\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.0704, rewards: 0.3890\n",
      "Iteration: 320, Train loss: -0.0000, rewards: 0.0008\n",
      "Iteration: 330, Train loss: -0.0002, rewards: 0.0031\n",
      "Iteration: 340, Train loss: -0.0004, rewards: 0.0008\n",
      "Iteration: 350, Train loss: -0.0015, rewards: 0.0071\n",
      "Iteration: 360, Train loss: -0.0015, rewards: 0.0252\n",
      "Iteration: 370, Train loss: -0.0005, rewards: 0.0291\n",
      "Iteration: 380, Train loss: 0.0006, rewards: 0.0157\n",
      "Iteration: 390, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 400, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.4747, Hits@10: 0.5576, MRR: 0.2384\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 420, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 430, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 440, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 450, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 460, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 470, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 480, Train loss: 0.0045, rewards: 0.1378\n",
      "Iteration: 490, Train loss: 0.0978, rewards: 0.5492\n",
      "Iteration: 500, Train loss: 0.1361, rewards: 0.5555\n",
      "Eval:\n",
      "Hits@1: 0.5668, Hits@3: 0.6313, Hits@10: 0.6636, MRR: 0.6047\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: 0.0815, rewards: 0.5610\n",
      "Iteration: 520, Train loss: 0.1139, rewards: 0.5758\n",
      "Iteration: 530, Train loss: 0.0625, rewards: 0.5855\n",
      "Iteration: 540, Train loss: 0.0278, rewards: 0.6055\n",
      "Iteration: 550, Train loss: 0.0298, rewards: 0.6097\n",
      "Iteration: 560, Train loss: 0.0304, rewards: 0.5978\n",
      "Iteration: 570, Train loss: 0.0502, rewards: 0.5683\n",
      "Iteration: 580, Train loss: 0.0481, rewards: 0.5897\n",
      "Iteration: 590, Train loss: 0.0578, rewards: 0.5997\n",
      "Iteration: 600, Train loss: 0.0647, rewards: 0.5902\n",
      "Eval:\n",
      "Hits@1: 0.6037, Hits@3: 0.6452, Hits@10: 0.6820, MRR: 0.6298\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: 0.0696, rewards: 0.6126\n",
      "Iteration: 620, Train loss: 0.0740, rewards: 0.5898\n",
      "Iteration: 630, Train loss: 0.0776, rewards: 0.5692\n",
      "Iteration: 640, Train loss: 0.1031, rewards: 0.6075\n",
      "Iteration: 650, Train loss: 0.1152, rewards: 0.5737\n",
      "Iteration: 660, Train loss: 0.1050, rewards: 0.5921\n",
      "Iteration: 670, Train loss: 0.0840, rewards: 0.6034\n",
      "Iteration: 680, Train loss: 0.0838, rewards: 0.5781\n",
      "Iteration: 690, Train loss: 0.0956, rewards: 0.6036\n",
      "Iteration: 700, Train loss: 0.0679, rewards: 0.6128\n",
      "Eval:\n",
      "Hits@1: 0.5991, Hits@3: 0.6313, Hits@10: 0.6728, MRR: 0.6228\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: 0.0735, rewards: 0.6078\n",
      "Iteration: 720, Train loss: 0.1045, rewards: 0.6239\n",
      "Iteration: 730, Train loss: 0.0873, rewards: 0.6249\n",
      "Iteration: 740, Train loss: 0.0669, rewards: 0.6376\n",
      "Iteration: 750, Train loss: 0.0857, rewards: 0.5929\n",
      "Iteration: 760, Train loss: 0.0692, rewards: 0.6085\n",
      "Iteration: 770, Train loss: 0.0899, rewards: 0.6141\n",
      "Iteration: 780, Train loss: 0.0950, rewards: 0.6246\n",
      "Iteration: 790, Train loss: 0.0905, rewards: 0.6198\n",
      "Iteration: 800, Train loss: 0.1118, rewards: 0.6098\n",
      "Eval:\n",
      "Hits@1: 0.6037, Hits@3: 0.6452, Hits@10: 0.6728, MRR: 0.6291\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: 0.1048, rewards: 0.5984\n",
      "Iteration: 820, Train loss: 0.0943, rewards: 0.6219\n",
      "Iteration: 830, Train loss: 0.0905, rewards: 0.6227\n",
      "Iteration: 840, Train loss: 0.0831, rewards: 0.6009\n",
      "Iteration: 850, Train loss: 0.0916, rewards: 0.5770\n",
      "Iteration: 860, Train loss: 0.1190, rewards: 0.6015\n",
      "Iteration: 870, Train loss: 0.1276, rewards: 0.6052\n",
      "Iteration: 880, Train loss: 0.0896, rewards: 0.6068\n",
      "Iteration: 890, Train loss: 0.1032, rewards: 0.6165\n",
      "Iteration: 900, Train loss: 0.1066, rewards: 0.6014\n",
      "Eval:\n",
      "Hits@1: 0.6083, Hits@3: 0.6359, Hits@10: 0.6682, MRR: 0.6277\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: 0.1103, rewards: 0.6244\n",
      "Iteration: 920, Train loss: 0.1067, rewards: 0.5930\n",
      "Iteration: 930, Train loss: 0.1102, rewards: 0.6110\n",
      "Iteration: 940, Train loss: 0.1084, rewards: 0.6146\n",
      "Iteration: 950, Train loss: 0.1189, rewards: 0.6220\n",
      "Iteration: 960, Train loss: 0.1143, rewards: 0.6307\n",
      "Iteration: 970, Train loss: 0.1227, rewards: 0.5985\n",
      "Iteration: 980, Train loss: 0.0882, rewards: 0.6206\n",
      "Iteration: 990, Train loss: 0.0877, rewards: 0.6224\n",
      "Iteration: 1000, Train loss: 0.0957, rewards: 0.6253\n",
      "Eval:\n",
      "Hits@1: 0.6083, Hits@3: 0.6313, Hits@10: 0.6636, MRR: 0.6259\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: 0.0907, rewards: 0.5890\n",
      "Iteration: 1020, Train loss: 0.1075, rewards: 0.6411\n",
      "Iteration: 1030, Train loss: 0.1104, rewards: 0.6165\n",
      "Iteration: 1040, Train loss: 0.1052, rewards: 0.6119\n",
      "Iteration: 1050, Train loss: 0.1023, rewards: 0.6313\n",
      "Iteration: 1060, Train loss: 0.1203, rewards: 0.6172\n",
      "Iteration: 1070, Train loss: 0.0912, rewards: 0.6198\n",
      "Iteration: 1080, Train loss: 0.0896, rewards: 0.6392\n",
      "Iteration: 1090, Train loss: 0.1001, rewards: 0.6227\n",
      "Iteration: 1100, Train loss: 0.1195, rewards: 0.6129\n",
      "Eval:\n",
      "Hits@1: 0.6129, Hits@3: 0.6498, Hits@10: 0.6682, MRR: 0.6334\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: 0.1316, rewards: 0.6520\n",
      "Iteration: 1120, Train loss: 0.1074, rewards: 0.6385\n",
      "Iteration: 1130, Train loss: 0.1096, rewards: 0.6127\n",
      "Iteration: 1140, Train loss: 0.1165, rewards: 0.6124\n",
      "Iteration: 1150, Train loss: 0.1200, rewards: 0.6465\n",
      "Iteration: 1160, Train loss: 0.1112, rewards: 0.6439\n",
      "Iteration: 1170, Train loss: 0.1175, rewards: 0.6203\n",
      "Iteration: 1180, Train loss: 0.1082, rewards: 0.6561\n",
      "Iteration: 1190, Train loss: 0.1172, rewards: 0.6323\n",
      "Iteration: 1200, Train loss: 0.1195, rewards: 0.6152\n",
      "Eval:\n",
      "Hits@1: 0.6175, Hits@3: 0.6544, Hits@10: 0.6820, MRR: 0.6386\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: 0.1207, rewards: 0.6283\n",
      "Iteration: 1220, Train loss: 0.1257, rewards: 0.6402\n",
      "Iteration: 1230, Train loss: 0.1220, rewards: 0.6134\n",
      "Iteration: 1240, Train loss: 0.1270, rewards: 0.6407\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1250, Train loss: 0.1169, rewards: 0.6342\n",
      "Iteration: 1260, Train loss: 0.1028, rewards: 0.6350\n",
      "Iteration: 1270, Train loss: 0.1285, rewards: 0.6259\n",
      "Iteration: 1280, Train loss: 0.1182, rewards: 0.6296\n",
      "Iteration: 1290, Train loss: 0.1080, rewards: 0.6423\n",
      "Iteration: 1300, Train loss: 0.1157, rewards: 0.6383\n",
      "Eval:\n",
      "Hits@1: 0.6221, Hits@3: 0.6498, Hits@10: 0.6774, MRR: 0.6398\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: 0.1178, rewards: 0.6272\n",
      "Iteration: 1320, Train loss: 0.1253, rewards: 0.6070\n",
      "Iteration: 1330, Train loss: 0.1051, rewards: 0.6425\n",
      "Iteration: 1340, Train loss: 0.1254, rewards: 0.6370\n",
      "Iteration: 1350, Train loss: 0.1264, rewards: 0.6219\n",
      "Iteration: 1360, Train loss: 0.1167, rewards: 0.6055\n",
      "Iteration: 1370, Train loss: 0.1268, rewards: 0.6503\n",
      "Iteration: 1380, Train loss: 0.1227, rewards: 0.6290\n",
      "Iteration: 1390, Train loss: 0.1179, rewards: 0.6409\n",
      "Iteration: 1400, Train loss: 0.1171, rewards: 0.6329\n",
      "Eval:\n",
      "Hits@1: 0.6221, Hits@3: 0.6452, Hits@10: 0.6728, MRR: 0.6379\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: 0.1276, rewards: 0.6363\n",
      "Iteration: 1420, Train loss: 0.1444, rewards: 0.6335\n",
      "Iteration: 1430, Train loss: 0.1642, rewards: 0.6607\n",
      "Iteration: 1440, Train loss: 0.1460, rewards: 0.6459\n",
      "Iteration: 1450, Train loss: 0.1410, rewards: 0.6486\n",
      "Iteration: 1460, Train loss: 0.1546, rewards: 0.6543\n",
      "Iteration: 1470, Train loss: 0.1654, rewards: 0.6235\n",
      "Iteration: 1480, Train loss: 0.1522, rewards: 0.6298\n",
      "Iteration: 1490, Train loss: 0.1555, rewards: 0.6407\n",
      "Iteration: 1500, Train loss: 0.1440, rewards: 0.6357\n",
      "Eval:\n",
      "Hits@1: 0.6175, Hits@3: 0.6498, Hits@10: 0.6728, MRR: 0.6377\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: 0.1499, rewards: 0.6329\n",
      "Iteration: 1520, Train loss: 0.1590, rewards: 0.6472\n",
      "Iteration: 1530, Train loss: 0.1576, rewards: 0.6407\n",
      "Iteration: 1540, Train loss: 0.1521, rewards: 0.6343\n",
      "Iteration: 1550, Train loss: 0.1370, rewards: 0.6297\n",
      "Iteration: 1560, Train loss: 0.1282, rewards: 0.6411\n",
      "Iteration: 1570, Train loss: 0.1599, rewards: 0.6507\n",
      "Iteration: 1580, Train loss: 0.1261, rewards: 0.6415\n",
      "Iteration: 1590, Train loss: 0.0995, rewards: 0.6300\n",
      "Iteration: 1600, Train loss: 0.1247, rewards: 0.6384\n",
      "Eval:\n",
      "Hits@1: 0.6267, Hits@3: 0.6498, Hits@10: 0.6866, MRR: 0.6444\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: 0.1493, rewards: 0.6584\n",
      "Iteration: 1620, Train loss: 0.1624, rewards: 0.6626\n",
      "Iteration: 1630, Train loss: 0.1329, rewards: 0.6621\n",
      "Iteration: 1640, Train loss: 0.1492, rewards: 0.6592\n",
      "Iteration: 1650, Train loss: 0.1353, rewards: 0.6603\n",
      "Iteration: 1660, Train loss: 0.1201, rewards: 0.6698\n",
      "Iteration: 1670, Train loss: 0.1166, rewards: 0.6759\n",
      "Iteration: 1680, Train loss: 0.0492, rewards: 0.5124\n",
      "Iteration: 1690, Train loss: 0.0944, rewards: 0.3967\n",
      "Iteration: 1700, Train loss: 0.0633, rewards: 0.6137\n",
      "Eval:\n",
      "Hits@1: 0.6129, Hits@3: 0.6636, Hits@10: 0.6866, MRR: 0.6410\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: 0.0354, rewards: 0.5939\n",
      "Iteration: 1720, Train loss: 0.0077, rewards: 0.6169\n",
      "Iteration: 1730, Train loss: 0.0076, rewards: 0.6151\n",
      "Iteration: 1740, Train loss: -0.0024, rewards: 0.5111\n",
      "Iteration: 1750, Train loss: -0.0170, rewards: 0.4784\n",
      "Iteration: 1760, Train loss: -0.0025, rewards: 0.5452\n",
      "Iteration: 1770, Train loss: 0.0417, rewards: 0.5908\n",
      "Iteration: 1780, Train loss: 0.0372, rewards: 0.5965\n",
      "Iteration: 1790, Train loss: 0.0182, rewards: 0.6179\n",
      "Iteration: 1800, Train loss: 0.0346, rewards: 0.6120\n",
      "Eval:\n",
      "Hits@1: 0.5991, Hits@3: 0.6636, Hits@10: 0.6912, MRR: 0.6350\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: 0.0642, rewards: 0.6220\n",
      "Iteration: 1820, Train loss: 0.0509, rewards: 0.6235\n",
      "Iteration: 1830, Train loss: 0.0421, rewards: 0.5913\n",
      "Iteration: 1840, Train loss: 0.0355, rewards: 0.5898\n",
      "Iteration: 1850, Train loss: 0.0223, rewards: 0.4834\n",
      "Iteration: 1860, Train loss: 0.0837, rewards: 0.5154\n",
      "Iteration: 1870, Train loss: 0.1343, rewards: 0.6167\n",
      "Iteration: 1880, Train loss: 0.1256, rewards: 0.6113\n",
      "Iteration: 1890, Train loss: 0.1018, rewards: 0.6039\n",
      "Iteration: 1900, Train loss: 0.1018, rewards: 0.6195\n",
      "Eval:\n",
      "Hits@1: 0.5899, Hits@3: 0.6544, Hits@10: 0.6774, MRR: 0.6252\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: 0.1064, rewards: 0.6064\n",
      "Iteration: 1920, Train loss: 0.1529, rewards: 0.6121\n",
      "Iteration: 1930, Train loss: 0.1656, rewards: 0.6260\n",
      "Iteration: 1940, Train loss: 0.1701, rewards: 0.6258\n",
      "Iteration: 1950, Train loss: 0.1575, rewards: 0.6046\n",
      "Iteration: 1960, Train loss: 0.1484, rewards: 0.6285\n",
      "Iteration: 1970, Train loss: 0.1797, rewards: 0.6102\n",
      "Iteration: 1980, Train loss: 0.1661, rewards: 0.6205\n",
      "Iteration: 1990, Train loss: 0.1744, rewards: 0.6307\n",
      "Iteration: 2000, Train loss: 0.1529, rewards: 0.6323\n",
      "Eval:\n",
      "Hits@1: 0.5945, Hits@3: 0.6590, Hits@10: 0.6820, MRR: 0.6299\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/personleadsorganization//test_beam/ ]\n",
      "Hits@1: 0.6207, Hits@3: 0.7112, Hits@10: 0.7629, MRR: 0.6734\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8633505654498226 (179 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-29 00:17:31,154]\u001b[0m Trial 3 finished with value: 0.8633505654498226 and parameters: {'lr': 0.0019521325083512431, 'bs': 127, 'b': 0.016728341237345012, 'l': 0.24373179849518972, 'ee': 100}. Best is trial 0 with value: 0.8691002909875059.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 1, Train loss: -0.5094, rewards: 0.5387\n",
      "Iteration: 2, Train loss: -0.1307, rewards: 0.1631\n",
      "Iteration: 3, Train loss: -0.7008, rewards: 0.3196\n",
      "Iteration: 4, Train loss: -0.3047, rewards: 0.1649\n",
      "Iteration: 5, Train loss: -0.4661, rewards: 0.4381\n",
      "Iteration: 6, Train loss: -0.3979, rewards: 0.4446\n",
      "Iteration: 7, Train loss: -0.2771, rewards: 0.4411\n",
      "Iteration: 8, Train loss: -0.4495, rewards: 0.4637\n",
      "Iteration: 9, Train loss: -0.5798, rewards: 0.4113\n",
      "Iteration: 10, Train loss: -0.5522, rewards: 0.4863\n",
      "Eval:\n",
      "Hits@1: 0.4931, Hits@3: 0.6083, Hits@10: 0.6452, MRR: 0.5583\n",
      "------------------------------------------------------------\n",
      "Iteration: 11, Train loss: -0.4467, rewards: 0.5589\n",
      "Iteration: 12, Train loss: -0.5554, rewards: 0.4994\n",
      "Iteration: 13, Train loss: -0.5622, rewards: 0.3673\n",
      "Iteration: 14, Train loss: -0.6459, rewards: 0.3577\n",
      "Iteration: 15, Train loss: -0.5537, rewards: 0.5274\n",
      "Iteration: 16, Train loss: -0.4768, rewards: 0.6286\n",
      "Iteration: 17, Train loss: -0.5868, rewards: 0.5470\n",
      "Iteration: 18, Train loss: -0.4609, rewards: 0.5726\n",
      "Iteration: 19, Train loss: -0.5339, rewards: 0.5792\n",
      "Iteration: 20, Train loss: -0.7290, rewards: 0.4149\n",
      "Eval:\n",
      "Hits@1: 0.5760, Hits@3: 0.6636, Hits@10: 0.6820, MRR: 0.6194\n",
      "------------------------------------------------------------\n",
      "Iteration: 21, Train loss: -0.5861, rewards: 0.4708\n",
      "Iteration: 22, Train loss: -0.5978, rewards: 0.5214\n",
      "Iteration: 23, Train loss: -0.4856, rewards: 0.5768\n",
      "Iteration: 24, Train loss: -0.5954, rewards: 0.6131\n",
      "Iteration: 25, Train loss: -0.6748, rewards: 0.6000\n",
      "Iteration: 26, Train loss: -0.5737, rewards: 0.5476\n",
      "Iteration: 27, Train loss: -0.5803, rewards: 0.5006\n",
      "Iteration: 28, Train loss: -0.5325, rewards: 0.5274\n",
      "Iteration: 29, Train loss: -0.5075, rewards: 0.5107\n",
      "Iteration: 30, Train loss: -0.5086, rewards: 0.5333\n",
      "Eval:\n",
      "Hits@1: 0.5484, Hits@3: 0.6498, Hits@10: 0.6774, MRR: 0.5991\n",
      "------------------------------------------------------------\n",
      "Iteration: 31, Train loss: -0.4026, rewards: 0.5060\n",
      "Iteration: 32, Train loss: -0.4708, rewards: 0.5363\n",
      "Iteration: 33, Train loss: -0.4120, rewards: 0.5137\n",
      "Iteration: 34, Train loss: -0.3999, rewards: 0.5423\n",
      "Iteration: 35, Train loss: -0.2832, rewards: 0.5571\n",
      "Iteration: 36, Train loss: -0.5877, rewards: 0.6149\n",
      "Iteration: 37, Train loss: -0.5193, rewards: 0.5976\n",
      "Iteration: 38, Train loss: -0.4484, rewards: 0.6310\n",
      "Iteration: 39, Train loss: -0.3737, rewards: 0.5923\n",
      "Iteration: 40, Train loss: -0.4679, rewards: 0.6327\n",
      "Eval:\n",
      "Hits@1: 0.6313, Hits@3: 0.6682, Hits@10: 0.6866, MRR: 0.6539\n",
      "------------------------------------------------------------\n",
      "Iteration: 41, Train loss: -0.3318, rewards: 0.6411\n",
      "Iteration: 42, Train loss: -0.5178, rewards: 0.4845\n",
      "Iteration: 43, Train loss: -0.4034, rewards: 0.6399\n",
      "Iteration: 44, Train loss: -0.5370, rewards: 0.5792\n",
      "Iteration: 45, Train loss: -0.5676, rewards: 0.6077\n",
      "Iteration: 46, Train loss: -0.4763, rewards: 0.5315\n",
      "Iteration: 47, Train loss: -0.6035, rewards: 0.5560\n",
      "Iteration: 48, Train loss: -0.6125, rewards: 0.5619\n",
      "Iteration: 49, Train loss: -0.4917, rewards: 0.6458\n",
      "Iteration: 50, Train loss: -0.5207, rewards: 0.6690\n",
      "Eval:\n",
      "Hits@1: 0.6544, Hits@3: 0.6820, Hits@10: 0.6866, MRR: 0.6681\n",
      "------------------------------------------------------------\n",
      "Iteration: 51, Train loss: -0.3587, rewards: 0.6744\n",
      "Iteration: 52, Train loss: -0.2861, rewards: 0.6851\n",
      "Iteration: 53, Train loss: -0.3496, rewards: 0.6232\n",
      "Iteration: 54, Train loss: -0.2689, rewards: 0.6637\n",
      "Iteration: 55, Train loss: -0.2469, rewards: 0.5667\n",
      "Iteration: 56, Train loss: -0.4246, rewards: 0.6673\n",
      "Iteration: 57, Train loss: -0.4013, rewards: 0.6542\n",
      "Iteration: 58, Train loss: -0.3389, rewards: 0.5560\n",
      "Iteration: 59, Train loss: -0.2927, rewards: 0.6542\n",
      "Iteration: 60, Train loss: -0.5003, rewards: 0.5423\n",
      "Eval:\n",
      "Hits@1: 0.6406, Hits@3: 0.6774, Hits@10: 0.6912, MRR: 0.6602\n",
      "------------------------------------------------------------\n",
      "Iteration: 61, Train loss: -0.4560, rewards: 0.6917\n",
      "Iteration: 62, Train loss: -0.4581, rewards: 0.6054\n",
      "Iteration: 63, Train loss: -0.4587, rewards: 0.5327\n",
      "Iteration: 64, Train loss: -0.3019, rewards: 0.5619\n",
      "Iteration: 65, Train loss: -0.4816, rewards: 0.7012\n",
      "Iteration: 66, Train loss: -0.3891, rewards: 0.6536\n",
      "Iteration: 67, Train loss: -0.5411, rewards: 0.6637\n",
      "Iteration: 68, Train loss: -0.5433, rewards: 0.5470\n",
      "Iteration: 69, Train loss: -0.4851, rewards: 0.6464\n",
      "Iteration: 70, Train loss: -0.5520, rewards: 0.6286\n",
      "Eval:\n",
      "Hits@1: 0.6590, Hits@3: 0.6866, Hits@10: 0.6866, MRR: 0.6734\n",
      "------------------------------------------------------------\n",
      "Iteration: 71, Train loss: -0.5418, rewards: 0.5625\n",
      "Iteration: 72, Train loss: -0.4362, rewards: 0.6065\n",
      "Iteration: 73, Train loss: -0.4150, rewards: 0.6179\n",
      "Iteration: 74, Train loss: -0.4434, rewards: 0.6601\n",
      "Iteration: 75, Train loss: -0.4997, rewards: 0.6125\n",
      "Iteration: 76, Train loss: -0.4845, rewards: 0.6173\n",
      "Iteration: 77, Train loss: -0.2306, rewards: 0.6685\n",
      "Iteration: 78, Train loss: -0.5289, rewards: 0.5881\n",
      "Iteration: 79, Train loss: -0.3660, rewards: 0.6506\n",
      "Iteration: 80, Train loss: -0.3457, rewards: 0.6595\n",
      "Eval:\n",
      "Hits@1: 0.6682, Hits@3: 0.6866, Hits@10: 0.6866, MRR: 0.6773\n",
      "------------------------------------------------------------\n",
      "Iteration: 81, Train loss: -0.5274, rewards: 0.6101\n",
      "Iteration: 82, Train loss: -0.5050, rewards: 0.6452\n",
      "Iteration: 83, Train loss: -0.3162, rewards: 0.6315\n",
      "Iteration: 84, Train loss: -0.3077, rewards: 0.6744\n",
      "Iteration: 85, Train loss: -0.3789, rewards: 0.6899\n",
      "Iteration: 86, Train loss: -0.4349, rewards: 0.6232\n",
      "Iteration: 87, Train loss: -0.3783, rewards: 0.5994\n",
      "Iteration: 88, Train loss: -0.4453, rewards: 0.6613\n",
      "Iteration: 89, Train loss: -0.4448, rewards: 0.5863\n",
      "Iteration: 90, Train loss: -0.4017, rewards: 0.6708\n",
      "Eval:\n",
      "Hits@1: 0.6728, Hits@3: 0.6866, Hits@10: 0.6959, MRR: 0.6813\n",
      "------------------------------------------------------------\n",
      "Iteration: 91, Train loss: -0.5478, rewards: 0.6101\n",
      "Iteration: 92, Train loss: -0.4810, rewards: 0.6137\n",
      "Iteration: 93, Train loss: -0.3720, rewards: 0.5673\n",
      "Iteration: 94, Train loss: -0.2698, rewards: 0.6339\n",
      "Iteration: 95, Train loss: -0.4103, rewards: 0.6667\n",
      "Iteration: 96, Train loss: -0.3307, rewards: 0.6411\n",
      "Iteration: 97, Train loss: -0.5753, rewards: 0.5565\n",
      "Iteration: 98, Train loss: -0.4933, rewards: 0.6595\n",
      "Iteration: 99, Train loss: -0.5361, rewards: 0.5839\n",
      "Iteration: 100, Train loss: -0.4239, rewards: 0.7077\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6959, MRR: 0.6885\n",
      "------------------------------------------------------------\n",
      "Iteration: 101, Train loss: -0.5325, rewards: 0.5762\n",
      "Iteration: 102, Train loss: -0.4298, rewards: 0.6815\n",
      "Iteration: 103, Train loss: -0.6538, rewards: 0.6256\n",
      "Iteration: 104, Train loss: -0.5194, rewards: 0.6077\n",
      "Iteration: 105, Train loss: -0.5057, rewards: 0.5417\n",
      "Iteration: 106, Train loss: -0.5728, rewards: 0.6583\n",
      "Iteration: 107, Train loss: -0.4727, rewards: 0.6911\n",
      "Iteration: 108, Train loss: -0.5255, rewards: 0.6440\n",
      "Iteration: 109, Train loss: -0.6124, rewards: 0.5649\n",
      "Iteration: 110, Train loss: -0.5466, rewards: 0.5887\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.6912, MRR: 0.6872\n",
      "------------------------------------------------------------\n",
      "Iteration: 111, Train loss: -0.3795, rewards: 0.6536\n",
      "Iteration: 112, Train loss: -0.5194, rewards: 0.6702\n",
      "Iteration: 113, Train loss: -0.6602, rewards: 0.6452\n",
      "Iteration: 114, Train loss: -0.0743, rewards: 0.7113\n",
      "Iteration: 115, Train loss: -0.4260, rewards: 0.6012\n",
      "Iteration: 116, Train loss: -0.3886, rewards: 0.6512\n",
      "Iteration: 117, Train loss: -0.5100, rewards: 0.6399\n",
      "Iteration: 118, Train loss: -0.5331, rewards: 0.6262\n",
      "Iteration: 119, Train loss: -0.6265, rewards: 0.5923\n",
      "Iteration: 120, Train loss: -0.5973, rewards: 0.5780\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6912, Hits@10: 0.7005, MRR: 0.6887\n",
      "------------------------------------------------------------\n",
      "Iteration: 121, Train loss: -0.6552, rewards: 0.5911\n",
      "Iteration: 122, Train loss: -0.5402, rewards: 0.6482\n",
      "Iteration: 123, Train loss: -0.5553, rewards: 0.6280\n",
      "Iteration: 124, Train loss: -0.4991, rewards: 0.5810\n",
      "Iteration: 125, Train loss: -0.5193, rewards: 0.6429\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 126, Train loss: -0.5527, rewards: 0.7006\n",
      "Iteration: 127, Train loss: -0.5545, rewards: 0.6202\n",
      "Iteration: 128, Train loss: -0.5003, rewards: 0.6321\n",
      "Iteration: 129, Train loss: -0.4804, rewards: 0.6470\n",
      "Iteration: 130, Train loss: -0.5244, rewards: 0.6536\n",
      "Eval:\n",
      "Hits@1: 0.6820, Hits@3: 0.6959, Hits@10: 0.7051, MRR: 0.6894\n",
      "------------------------------------------------------------\n",
      "Iteration: 131, Train loss: -0.4397, rewards: 0.7214\n",
      "Iteration: 132, Train loss: -0.4955, rewards: 0.5768\n",
      "Iteration: 133, Train loss: -0.3504, rewards: 0.5625\n",
      "Iteration: 134, Train loss: -0.6144, rewards: 0.6875\n",
      "Iteration: 135, Train loss: -0.5510, rewards: 0.5256\n",
      "Iteration: 136, Train loss: -0.4343, rewards: 0.6095\n",
      "Iteration: 137, Train loss: -0.5063, rewards: 0.6429\n",
      "Iteration: 138, Train loss: -0.5420, rewards: 0.7089\n",
      "Iteration: 139, Train loss: -0.7116, rewards: 0.6077\n",
      "Iteration: 140, Train loss: -0.6103, rewards: 0.6905\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.6982\n",
      "------------------------------------------------------------\n",
      "Iteration: 141, Train loss: -0.5920, rewards: 0.5875\n",
      "Iteration: 142, Train loss: -0.5348, rewards: 0.6101\n",
      "Iteration: 143, Train loss: -0.4620, rewards: 0.6339\n",
      "Iteration: 144, Train loss: -0.4749, rewards: 0.6696\n",
      "Iteration: 145, Train loss: -0.3983, rewards: 0.6113\n",
      "Iteration: 146, Train loss: -0.4245, rewards: 0.6762\n",
      "Iteration: 147, Train loss: -0.4455, rewards: 0.7179\n",
      "Iteration: 148, Train loss: -0.4301, rewards: 0.6631\n",
      "Iteration: 149, Train loss: -0.5315, rewards: 0.7315\n",
      "Iteration: 150, Train loss: -0.3001, rewards: 0.6750\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7028\n",
      "------------------------------------------------------------\n",
      "Iteration: 151, Train loss: -0.3853, rewards: 0.6036\n",
      "Iteration: 152, Train loss: -0.4702, rewards: 0.7036\n",
      "Iteration: 153, Train loss: -0.4630, rewards: 0.6821\n",
      "Iteration: 154, Train loss: -0.4686, rewards: 0.6476\n",
      "Iteration: 155, Train loss: -0.4194, rewards: 0.7470\n",
      "Iteration: 156, Train loss: -0.5864, rewards: 0.6167\n",
      "Iteration: 157, Train loss: -0.4612, rewards: 0.6613\n",
      "Iteration: 158, Train loss: -0.4724, rewards: 0.6815\n",
      "Iteration: 159, Train loss: -0.3813, rewards: 0.7048\n",
      "Iteration: 160, Train loss: -0.4633, rewards: 0.7256\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7051\n",
      "------------------------------------------------------------\n",
      "Iteration: 161, Train loss: -0.4287, rewards: 0.6637\n",
      "Iteration: 162, Train loss: -0.5779, rewards: 0.6857\n",
      "Iteration: 163, Train loss: -0.5787, rewards: 0.6083\n",
      "Iteration: 164, Train loss: -0.4135, rewards: 0.7357\n",
      "Iteration: 165, Train loss: -0.4585, rewards: 0.7435\n",
      "Iteration: 166, Train loss: -0.4936, rewards: 0.6381\n",
      "Iteration: 167, Train loss: -0.5262, rewards: 0.6720\n",
      "Iteration: 168, Train loss: -0.6470, rewards: 0.6792\n",
      "Iteration: 169, Train loss: -0.6042, rewards: 0.6577\n",
      "Iteration: 170, Train loss: -0.5526, rewards: 0.6643\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7043\n",
      "------------------------------------------------------------\n",
      "Iteration: 171, Train loss: -0.6160, rewards: 0.7363\n",
      "Iteration: 172, Train loss: -0.5281, rewards: 0.6113\n",
      "Iteration: 173, Train loss: -0.4954, rewards: 0.6899\n",
      "Iteration: 174, Train loss: -0.4263, rewards: 0.7643\n",
      "Iteration: 175, Train loss: -0.3321, rewards: 0.7256\n",
      "Iteration: 176, Train loss: -0.4400, rewards: 0.6440\n",
      "Iteration: 177, Train loss: -0.2707, rewards: 0.5470\n",
      "Iteration: 178, Train loss: -0.3410, rewards: 0.7702\n",
      "Iteration: 179, Train loss: -0.3976, rewards: 0.6226\n",
      "Iteration: 180, Train loss: -0.2836, rewards: 0.7030\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7051\n",
      "------------------------------------------------------------\n",
      "Iteration: 181, Train loss: -0.3564, rewards: 0.6643\n",
      "Iteration: 182, Train loss: -0.3597, rewards: 0.6298\n",
      "Iteration: 183, Train loss: -0.4604, rewards: 0.7500\n",
      "Iteration: 184, Train loss: -0.5516, rewards: 0.6577\n",
      "Iteration: 185, Train loss: -0.4238, rewards: 0.6935\n",
      "Iteration: 186, Train loss: -0.3740, rewards: 0.7167\n",
      "Iteration: 187, Train loss: -0.4879, rewards: 0.6708\n",
      "Iteration: 188, Train loss: -0.3874, rewards: 0.6589\n",
      "Iteration: 189, Train loss: -0.4178, rewards: 0.7494\n",
      "Iteration: 190, Train loss: -0.5609, rewards: 0.7738\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7037\n",
      "------------------------------------------------------------\n",
      "Iteration: 191, Train loss: -0.4169, rewards: 0.7637\n",
      "Iteration: 192, Train loss: -0.3876, rewards: 0.6619\n",
      "Iteration: 193, Train loss: -0.2827, rewards: 0.7440\n",
      "Iteration: 194, Train loss: -0.3719, rewards: 0.6667\n",
      "Iteration: 195, Train loss: -0.3593, rewards: 0.6607\n",
      "Iteration: 196, Train loss: -0.2979, rewards: 0.7827\n",
      "Iteration: 197, Train loss: -0.4673, rewards: 0.6482\n",
      "Iteration: 198, Train loss: -0.4501, rewards: 0.6702\n",
      "Iteration: 199, Train loss: -0.3441, rewards: 0.6833\n",
      "Iteration: 200, Train loss: -0.4027, rewards: 0.6964\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7029\n",
      "------------------------------------------------------------\n",
      "Iteration: 201, Train loss: -0.2340, rewards: 0.7232\n",
      "Iteration: 202, Train loss: -0.4012, rewards: 0.6863\n",
      "Iteration: 203, Train loss: -0.3879, rewards: 0.6470\n",
      "Iteration: 204, Train loss: -0.2722, rewards: 0.6946\n",
      "Iteration: 205, Train loss: -0.3515, rewards: 0.7030\n",
      "Iteration: 206, Train loss: -0.4373, rewards: 0.6649\n",
      "Iteration: 207, Train loss: -0.4819, rewards: 0.7625\n",
      "Iteration: 208, Train loss: -0.4919, rewards: 0.6970\n",
      "Iteration: 209, Train loss: -0.4869, rewards: 0.6036\n",
      "Iteration: 210, Train loss: -0.4614, rewards: 0.6679\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7034\n",
      "------------------------------------------------------------\n",
      "Iteration: 211, Train loss: -0.4069, rewards: 0.7911\n",
      "Iteration: 212, Train loss: -0.2702, rewards: 0.6958\n",
      "Iteration: 213, Train loss: -0.5155, rewards: 0.6708\n",
      "Iteration: 214, Train loss: -0.3139, rewards: 0.6589\n",
      "Iteration: 215, Train loss: -0.4004, rewards: 0.7083\n",
      "Iteration: 216, Train loss: -0.4575, rewards: 0.6268\n",
      "Iteration: 217, Train loss: -0.5073, rewards: 0.6589\n",
      "Iteration: 218, Train loss: -0.4395, rewards: 0.6952\n",
      "Iteration: 219, Train loss: -0.6332, rewards: 0.6458\n",
      "Iteration: 220, Train loss: -0.6145, rewards: 0.6970\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7033\n",
      "------------------------------------------------------------\n",
      "Iteration: 221, Train loss: -0.7387, rewards: 0.7077\n",
      "Iteration: 222, Train loss: -0.4082, rewards: 0.6798\n",
      "Iteration: 223, Train loss: -0.4764, rewards: 0.7298\n",
      "Iteration: 224, Train loss: -0.4695, rewards: 0.6440\n",
      "Iteration: 225, Train loss: -0.5153, rewards: 0.6839\n",
      "Iteration: 226, Train loss: -0.5358, rewards: 0.7315\n",
      "Iteration: 227, Train loss: -0.4306, rewards: 0.6625\n",
      "Iteration: 228, Train loss: -0.2159, rewards: 0.7065\n",
      "Iteration: 229, Train loss: -0.3325, rewards: 0.7375\n",
      "Iteration: 230, Train loss: -0.3487, rewards: 0.7417\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7052\n",
      "------------------------------------------------------------\n",
      "Iteration: 231, Train loss: -0.4303, rewards: 0.7458\n",
      "Iteration: 232, Train loss: -0.4247, rewards: 0.6065\n",
      "Iteration: 233, Train loss: -0.4109, rewards: 0.5905\n",
      "Iteration: 234, Train loss: -0.2889, rewards: 0.6720\n",
      "Iteration: 235, Train loss: -0.3887, rewards: 0.6339\n",
      "Iteration: 236, Train loss: -0.3262, rewards: 0.6518\n",
      "Iteration: 237, Train loss: -0.4875, rewards: 0.6595\n",
      "Iteration: 238, Train loss: -0.5065, rewards: 0.6958\n",
      "Iteration: 239, Train loss: -0.5926, rewards: 0.6310\n",
      "Iteration: 240, Train loss: -0.5909, rewards: 0.6173\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7037\n",
      "------------------------------------------------------------\n",
      "Iteration: 241, Train loss: -0.6728, rewards: 0.6298\n",
      "Iteration: 242, Train loss: -0.6050, rewards: 0.6512\n",
      "Iteration: 243, Train loss: -0.5353, rewards: 0.6863\n",
      "Iteration: 244, Train loss: -0.4188, rewards: 0.6214\n",
      "Iteration: 245, Train loss: -0.3476, rewards: 0.6679\n",
      "Iteration: 246, Train loss: -0.3989, rewards: 0.7173\n",
      "Iteration: 247, Train loss: -0.4480, rewards: 0.7542\n",
      "Iteration: 248, Train loss: -0.4809, rewards: 0.7500\n",
      "Iteration: 249, Train loss: -0.4156, rewards: 0.6940\n",
      "Iteration: 250, Train loss: -0.5429, rewards: 0.6810\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7057\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 251, Train loss: -0.3675, rewards: 0.7238\n",
      "Iteration: 252, Train loss: -0.3554, rewards: 0.7583\n",
      "Iteration: 253, Train loss: -0.5169, rewards: 0.6131\n",
      "Iteration: 254, Train loss: -0.1842, rewards: 0.7548\n",
      "Iteration: 255, Train loss: -0.3032, rewards: 0.6940\n",
      "Iteration: 256, Train loss: -0.3834, rewards: 0.7333\n",
      "Iteration: 257, Train loss: -0.3897, rewards: 0.7661\n",
      "Iteration: 258, Train loss: -0.5166, rewards: 0.6827\n",
      "Iteration: 259, Train loss: -0.4682, rewards: 0.7202\n",
      "Iteration: 260, Train loss: -0.3002, rewards: 0.6964\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7005\n",
      "------------------------------------------------------------\n",
      "Iteration: 261, Train loss: -0.5181, rewards: 0.7196\n",
      "Iteration: 262, Train loss: -0.4115, rewards: 0.7625\n",
      "Iteration: 263, Train loss: -0.4588, rewards: 0.5851\n",
      "Iteration: 264, Train loss: -0.2331, rewards: 0.7220\n",
      "Iteration: 265, Train loss: -0.3317, rewards: 0.7875\n",
      "Iteration: 266, Train loss: -0.3843, rewards: 0.6792\n",
      "Iteration: 267, Train loss: -0.4915, rewards: 0.7214\n",
      "Iteration: 268, Train loss: -0.3178, rewards: 0.7036\n",
      "Iteration: 269, Train loss: -0.3570, rewards: 0.6393\n",
      "Iteration: 270, Train loss: -0.4632, rewards: 0.7601\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.7014\n",
      "------------------------------------------------------------\n",
      "Iteration: 271, Train loss: -0.3802, rewards: 0.6464\n",
      "Iteration: 272, Train loss: -0.2434, rewards: 0.7048\n",
      "Iteration: 273, Train loss: -0.3566, rewards: 0.7738\n",
      "Iteration: 274, Train loss: -0.4513, rewards: 0.7167\n",
      "Iteration: 275, Train loss: -0.4386, rewards: 0.6429\n",
      "Iteration: 276, Train loss: -0.4977, rewards: 0.7423\n",
      "Iteration: 277, Train loss: -0.5365, rewards: 0.6470\n",
      "Iteration: 278, Train loss: -0.4801, rewards: 0.6310\n",
      "Iteration: 279, Train loss: -0.4868, rewards: 0.6339\n",
      "Iteration: 280, Train loss: -0.3745, rewards: 0.7155\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7035\n",
      "------------------------------------------------------------\n",
      "Iteration: 281, Train loss: -0.5418, rewards: 0.6685\n",
      "Iteration: 282, Train loss: -0.4391, rewards: 0.7530\n",
      "Iteration: 283, Train loss: -0.2521, rewards: 0.6929\n",
      "Iteration: 284, Train loss: -0.2881, rewards: 0.6655\n",
      "Iteration: 285, Train loss: -0.3146, rewards: 0.7411\n",
      "Iteration: 286, Train loss: -0.3786, rewards: 0.6161\n",
      "Iteration: 287, Train loss: -0.3356, rewards: 0.6190\n",
      "Iteration: 288, Train loss: -0.5283, rewards: 0.5863\n",
      "Iteration: 289, Train loss: -0.5617, rewards: 0.7173\n",
      "Iteration: 290, Train loss: -0.6048, rewards: 0.6750\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7066\n",
      "------------------------------------------------------------\n",
      "Iteration: 291, Train loss: -0.4038, rewards: 0.7375\n",
      "Iteration: 292, Train loss: -0.3730, rewards: 0.6565\n",
      "Iteration: 293, Train loss: -0.4245, rewards: 0.7542\n",
      "Iteration: 294, Train loss: -0.5017, rewards: 0.6571\n",
      "Iteration: 295, Train loss: -0.4078, rewards: 0.6238\n",
      "Iteration: 296, Train loss: -0.3046, rewards: 0.6982\n",
      "Iteration: 297, Train loss: -0.3210, rewards: 0.6804\n",
      "Iteration: 298, Train loss: -0.4341, rewards: 0.6845\n",
      "Iteration: 299, Train loss: -0.4346, rewards: 0.6786\n",
      "Iteration: 300, Train loss: -0.5277, rewards: 0.6935\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7143, Hits@10: 0.7143, MRR: 0.7035\n",
      "------------------------------------------------------------\n",
      "Iteration: 301, Train loss: -0.3684, rewards: 0.6488\n",
      "Iteration: 302, Train loss: -0.4284, rewards: 0.7310\n",
      "Iteration: 303, Train loss: -0.4306, rewards: 0.7298\n",
      "Iteration: 304, Train loss: -0.5559, rewards: 0.8083\n",
      "Iteration: 305, Train loss: -0.4978, rewards: 0.6113\n",
      "Iteration: 306, Train loss: -0.3796, rewards: 0.7429\n",
      "Iteration: 307, Train loss: -0.4513, rewards: 0.6393\n",
      "Iteration: 308, Train loss: -0.4403, rewards: 0.6137\n",
      "Iteration: 309, Train loss: -0.4409, rewards: 0.6738\n",
      "Iteration: 310, Train loss: -0.5727, rewards: 0.7375\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7014\n",
      "------------------------------------------------------------\n",
      "Iteration: 311, Train loss: -0.5425, rewards: 0.6399\n",
      "Iteration: 312, Train loss: -0.6155, rewards: 0.7411\n",
      "Iteration: 313, Train loss: -0.5214, rewards: 0.6518\n",
      "Iteration: 314, Train loss: -0.4263, rewards: 0.7202\n",
      "Iteration: 315, Train loss: -0.3867, rewards: 0.6363\n",
      "Iteration: 316, Train loss: -0.6475, rewards: 0.7065\n",
      "Iteration: 317, Train loss: -0.3813, rewards: 0.6446\n",
      "Iteration: 318, Train loss: -0.6112, rewards: 0.7274\n",
      "Iteration: 319, Train loss: -0.4519, rewards: 0.6625\n",
      "Iteration: 320, Train loss: -0.4500, rewards: 0.7286\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7005\n",
      "------------------------------------------------------------\n",
      "Iteration: 321, Train loss: -0.4445, rewards: 0.6935\n",
      "Iteration: 322, Train loss: -0.3327, rewards: 0.6506\n",
      "Iteration: 323, Train loss: -0.6111, rewards: 0.7030\n",
      "Iteration: 324, Train loss: -0.4317, rewards: 0.6667\n",
      "Iteration: 325, Train loss: -0.4201, rewards: 0.7929\n",
      "Iteration: 326, Train loss: -0.3139, rewards: 0.6940\n",
      "Iteration: 327, Train loss: -0.3867, rewards: 0.7167\n",
      "Iteration: 328, Train loss: -0.2899, rewards: 0.7274\n",
      "Iteration: 329, Train loss: -0.5504, rewards: 0.6625\n",
      "Iteration: 330, Train loss: -0.5279, rewards: 0.7649\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7051, Hits@10: 0.7097, MRR: 0.7016\n",
      "------------------------------------------------------------\n",
      "Iteration: 331, Train loss: -0.4396, rewards: 0.6899\n",
      "Iteration: 332, Train loss: -0.5219, rewards: 0.6958\n",
      "Iteration: 333, Train loss: -0.3505, rewards: 0.7012\n",
      "Iteration: 334, Train loss: -0.3581, rewards: 0.7321\n",
      "Iteration: 335, Train loss: -0.2500, rewards: 0.6744\n",
      "Iteration: 336, Train loss: -0.4110, rewards: 0.7577\n",
      "Iteration: 337, Train loss: -0.2741, rewards: 0.6518\n",
      "Iteration: 338, Train loss: -0.4923, rewards: 0.7054\n",
      "Iteration: 339, Train loss: -0.3478, rewards: 0.7060\n",
      "Iteration: 340, Train loss: -0.4994, rewards: 0.6548\n",
      "Eval:\n",
      "Hits@1: 0.6866, Hits@3: 0.7097, Hits@10: 0.7143, MRR: 0.6985\n",
      "------------------------------------------------------------\n",
      "Iteration: 341, Train loss: -0.5067, rewards: 0.6601\n",
      "Iteration: 342, Train loss: -0.5507, rewards: 0.6601\n",
      "Iteration: 343, Train loss: -0.4816, rewards: 0.7256\n",
      "Iteration: 344, Train loss: -0.4228, rewards: 0.7714\n",
      "Iteration: 345, Train loss: -0.4157, rewards: 0.7167\n",
      "Iteration: 346, Train loss: -0.4028, rewards: 0.6958\n",
      "Iteration: 347, Train loss: -0.5323, rewards: 0.5917\n",
      "Iteration: 348, Train loss: -0.3631, rewards: 0.5845\n",
      "Iteration: 349, Train loss: -0.4277, rewards: 0.8024\n",
      "Iteration: 350, Train loss: -0.4921, rewards: 0.7726\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7028\n",
      "------------------------------------------------------------\n",
      "Iteration: 351, Train loss: -0.3257, rewards: 0.6768\n",
      "Iteration: 352, Train loss: -0.4266, rewards: 0.6798\n",
      "Iteration: 353, Train loss: -0.3686, rewards: 0.6643\n",
      "Iteration: 354, Train loss: -0.5209, rewards: 0.7161\n",
      "Iteration: 355, Train loss: -0.4256, rewards: 0.7399\n",
      "Iteration: 356, Train loss: -0.4596, rewards: 0.6815\n",
      "Iteration: 357, Train loss: -0.4183, rewards: 0.6470\n",
      "Iteration: 358, Train loss: -0.7186, rewards: 0.6839\n",
      "Iteration: 359, Train loss: -0.5290, rewards: 0.6780\n",
      "Iteration: 360, Train loss: -0.4097, rewards: 0.7244\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7020\n",
      "------------------------------------------------------------\n",
      "Iteration: 361, Train loss: -0.5610, rewards: 0.7286\n",
      "Iteration: 362, Train loss: -0.4515, rewards: 0.7012\n",
      "Iteration: 363, Train loss: -0.2308, rewards: 0.6315\n",
      "Iteration: 364, Train loss: -0.1582, rewards: 0.8220\n",
      "Iteration: 365, Train loss: -0.4543, rewards: 0.7196\n",
      "Iteration: 366, Train loss: -0.4141, rewards: 0.6643\n",
      "Iteration: 367, Train loss: -0.3078, rewards: 0.6571\n",
      "Iteration: 368, Train loss: -0.3451, rewards: 0.7161\n",
      "Iteration: 369, Train loss: -0.4763, rewards: 0.6946\n",
      "Iteration: 370, Train loss: -0.3374, rewards: 0.6774\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7055\n",
      "------------------------------------------------------------\n",
      "Iteration: 371, Train loss: -0.3248, rewards: 0.6982\n",
      "Iteration: 372, Train loss: -0.4073, rewards: 0.7512\n",
      "Iteration: 373, Train loss: -0.4732, rewards: 0.6238\n",
      "Iteration: 374, Train loss: -0.4065, rewards: 0.7048\n",
      "Iteration: 375, Train loss: -0.5101, rewards: 0.6012\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 376, Train loss: -0.4064, rewards: 0.6786\n",
      "Iteration: 377, Train loss: -0.5131, rewards: 0.6488\n",
      "Iteration: 378, Train loss: -0.4024, rewards: 0.6923\n",
      "Iteration: 379, Train loss: -0.4744, rewards: 0.7554\n",
      "Iteration: 380, Train loss: -0.4593, rewards: 0.6631\n",
      "Eval:\n",
      "Hits@1: 0.7005, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7051\n",
      "------------------------------------------------------------\n",
      "Iteration: 381, Train loss: -0.4566, rewards: 0.7256\n",
      "Iteration: 382, Train loss: -0.4694, rewards: 0.7173\n",
      "Iteration: 383, Train loss: -0.4603, rewards: 0.7256\n",
      "Iteration: 384, Train loss: -0.4405, rewards: 0.6970\n",
      "Iteration: 385, Train loss: -0.5118, rewards: 0.7470\n",
      "Iteration: 386, Train loss: -0.3566, rewards: 0.7179\n",
      "Iteration: 387, Train loss: -0.3988, rewards: 0.7185\n",
      "Iteration: 388, Train loss: -0.5872, rewards: 0.5982\n",
      "Iteration: 389, Train loss: -0.4205, rewards: 0.7113\n",
      "Iteration: 390, Train loss: -0.5238, rewards: 0.6601\n",
      "Eval:\n",
      "Hits@1: 0.6959, Hits@3: 0.7097, Hits@10: 0.7097, MRR: 0.7028\n",
      "------------------------------------------------------------\n",
      "Iteration: 391, Train loss: -0.4999, rewards: 0.5780\n",
      "Iteration: 392, Train loss: -0.2741, rewards: 0.6881\n",
      "Iteration: 393, Train loss: -0.4278, rewards: 0.6988\n",
      "Iteration: 394, Train loss: -0.6158, rewards: 0.6280\n",
      "Iteration: 395, Train loss: -0.5478, rewards: 0.6345\n",
      "Iteration: 396, Train loss: -0.4348, rewards: 0.6685\n",
      "Iteration: 397, Train loss: -0.4107, rewards: 0.7375\n",
      "Iteration: 398, Train loss: -0.6678, rewards: 0.6393\n",
      "Iteration: 399, Train loss: -0.5836, rewards: 0.7619\n",
      "Iteration: 400, Train loss: -0.5290, rewards: 0.6494\n",
      "Eval:\n",
      "Hits@1: 0.6912, Hits@3: 0.7051, Hits@10: 0.7051, MRR: 0.6974\n",
      "------------------------------------------------------------\n",
      "Iteration: 401, Train loss: -0.6112, rewards: 0.6113\n",
      "Iteration: 402, Train loss: -0.2346, rewards: 0.6631\n",
      "Iteration: 403, Train loss: -0.2956, rewards: 0.6345\n",
      "Iteration: 404, Train loss: -0.3138, rewards: 0.7810\n",
      "Iteration: 405, Train loss: -0.3372, rewards: 0.6512\n",
      "Iteration: 406, Train loss: -0.2107, rewards: 0.5143\n"
     ]
    }
   ],
   "source": [
    "sub_task = sub_tasks_list[0]\n",
    "study = optuna.create_study(storage=f\"sqlite:///{sub_task}.db\", study_name=f\"{sub_task}\", direction = 'maximize')\n",
    "study.optimize(objective, n_trials=1000)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
