{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "b2479ab1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-dc67f6ae-4c27-5869-bcd2-8560a2da46c7\"\n",
    "\n",
    "from model.ours3 import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "a39d5a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(task = None):\n",
    "    options = {}\n",
    "\n",
    "    #basic setting\n",
    "    task_name = 'nell-995' if task is None else task\n",
    "    \n",
    "    options['use_cuda'] = True\n",
    "    options['vocab_dir'] = '../MINERVA/datasets/data_preprocessed/nell/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "    options['relation_vocab'] = json.load(open(options['vocab_dir'] + '/relation_vocab.json'))\n",
    "    options['entity_vocab'] = json.load(open(options['vocab_dir'] + '/entity_vocab.json'))\n",
    "    \n",
    "    \n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_nell995-1/'\n",
    "        options['output_dir'] = './outputs_nell995-1/'\n",
    "    else:\n",
    "        options['pretrain_model_dir'] = f'./outputs_nell995-1/'\n",
    "        options['model_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        if not os.path.exists(options['output_dir']):\n",
    "            os.makedirs(options['output_dir'])\n",
    "        if not os.path.exists(options['model_dir']):\n",
    "            os.makedirs(options['model_dir'])\n",
    "\n",
    "    #agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = 1\n",
    "    options['max_num_actions'] = 40\n",
    "    options['gnn_layer'] = 2\n",
    "\n",
    "    #hyperparameters\n",
    "    options['test_rollouts'] = 40\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = 64\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = 0.15\n",
    "    options['Lambda'] = 0.15\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = 0.00005\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 5\n",
    "    options['total_iterations'] = 20*(64/options['batch_size'])\n",
    "    options['pool'] = 'max'\n",
    "    \n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "12f1b8ba",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n"
     ]
    }
   ],
   "source": [
    "params = set_params()\n",
    "params['test_rollouts'] = 100\n",
    "params['max_num_actions'] = 100\n",
    "params['eval_batch_size'] = 8\n",
    "\n",
    "trainer = Trainer(params)\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "# path_logger_file = trainer.path_logger_file\n",
    "output_dir = trainer.output_dir\n",
    "path_logger_file = output_dir\n",
    "\n",
    "if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "    os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "trainer.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "    \n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "17bc5425",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8207787473535506 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6278593427818233 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.572523027000639 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8249362244897959 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9319237147595357 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.9153204137843777 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.8065181795751745 (193 queries evaluated)\n",
      "WorksFor.txt\n",
      "MINERVA MAP: 0.8287528177373783 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.9408317251690747 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8386739927983896 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "sub_tasks_list = ['AthletePlaysInLeague',\n",
    "'AthletePlaysForTeam ',\n",
    "'AthleteHomeStadium ',\n",
    "'TeamPlaysSport',\n",
    "'AthletePlaysSport',\n",
    "'OrganizationHiredPerson',\n",
    "'PersonBornInLocation',\n",
    "'WorksFor',\n",
    "'organizationheadquarteredincity',\n",
    "'PersonLeadsOrganization']\n",
    "    \n",
    "map_list = {}    \n",
    "for sub_task in sub_tasks_list:\n",
    "    trainer.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "    \n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    map_list[sub_task] = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", \n",
    "              trainer.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "10a372ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "import optuna\n",
    "from model.ours3 import *\n",
    "global sub_tasks_list\n",
    "\n",
    "\n",
    "sub_tasks_list = [\n",
    "# 'AthletePlaysInLeague',\n",
    "# 'AthletePlaysForTeam ',\n",
    "#'AthleteHomeStadium '\n",
    "#'TeamPlaysSport',\n",
    "# 'AthletePlaysSport',\n",
    "'OrganizationHiredPerson',\n",
    "#'PersonBornInLocation'\n",
    "# 'WorksFor',\n",
    "# 'organizationheadquarteredincity',\n",
    "#'PersonLeadsOrganization'\n",
    "]\n",
    "\n",
    "def objective(trial):\n",
    "    \n",
    "    sub_task = sub_tasks_list[0]\n",
    "\n",
    "    lr = trial.suggest_float('lr', 1e-6, 1e-2)\n",
    "    bs = trial.suggest_int('bs', 4, 128)\n",
    "    b = trial.suggest_float('b', 0, 0.5)\n",
    "    l = trial.suggest_float('l', 0, 0.5)\n",
    "    ee = trial.suggest_categorical('ee', [10,20,50,100])\n",
    "\n",
    "    params = set_params(sub_task.lower().strip())\n",
    "    params['learning_rate'] = lr\n",
    "    params['eval_every'] = ee\n",
    "    params['batch_size'] = bs\n",
    "    params['beta'] = b\n",
    "    params['Lambda'] = l\n",
    "    params['total_iterations'] = min(50*params['eval_every'], 2000)\n",
    "\n",
    "    sub_trainer = Trainer(params)\n",
    "    sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "\n",
    "    sub_trainer.agent.train()\n",
    "    sub_trainer.train()\n",
    "    #     torch.save(sub_trainer.agent.state_dict(), params['model_dir'] + 'tmp.ckpt')\n",
    "\n",
    "    params['test_rollouts'] = 100\n",
    "    params['max_num_actions'] = 100\n",
    "    params['eval_batch_size'] = 8\n",
    "\n",
    "    sub_tester = Trainer(params)\n",
    "    sub_tester.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "    sub_tester.agent.eval()\n",
    "\n",
    "    save_path = sub_tester.save_path\n",
    "    output_dir = sub_tester.output_dir\n",
    "    path_logger_file = output_dir\n",
    "\n",
    "    if not os.path.exists(path_logger_file + \"/\" + \"test_beam\"):\n",
    "        os.mkdir(path_logger_file + \"/\" + \"test_beam\")\n",
    "    sub_tester.path_logger_file_ = path_logger_file + \"/\" + \"test_beam\" + \"/paths\"\n",
    "    with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "        score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "    sub_tester.test_environment = sub_tester.test_test_environment\n",
    "    test_results = sub_tester.test(beam=True, print_paths=True, save_model=True)  \n",
    "\n",
    "    sub_tester.data_input_dir = f'../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    MAP = nell_eval(path_logger_file + \"/\" + \"test_beam/\" + \"pathsanswers\", \n",
    "              sub_tester.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')\n",
    "\n",
    "    del sub_tester, sub_trainer\n",
    "    torch.cuda.empty_cache()\n",
    "    gc.collect()\n",
    "    \n",
    "    return MAP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ae521015",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-29 20:35:56,547]\u001b[0m A new study created in RDB with name: OrganizationHiredPerson\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/root/miniconda3/lib/python3.10/site-packages/torch/nn/_reduction.py:42: UserWarning: size_average and reduce args will be deprecated, please use reduction='none' instead.\n",
      "  warnings.warn(warning.format(ret))\n",
      "/root/Research/GraphRL/experiments/model/ours3.py:334: UserWarning: Implicit dimension choice for log_softmax has been deprecated. Change the call to include dim=X as an argument.\n",
      "  return loss, new_state, F.log_softmax(scores), label_action, chosen_relation\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 5, Train loss: -1.1495, rewards: 0.1134\n",
      "Iteration: 10, Train loss: -1.3009, rewards: 0.1275\n",
      "Iteration: 15, Train loss: -1.3588, rewards: 0.1476\n",
      "Iteration: 20, Train loss: -1.3650, rewards: 0.1501\n",
      "Iteration: 25, Train loss: -1.3368, rewards: 0.1559\n",
      "Iteration: 30, Train loss: -1.4039, rewards: 0.1946\n",
      "Iteration: 35, Train loss: -1.4646, rewards: 0.2152\n",
      "Iteration: 40, Train loss: -1.4522, rewards: 0.2199\n",
      "Iteration: 45, Train loss: -1.5234, rewards: 0.2348\n",
      "Iteration: 50, Train loss: -1.4551, rewards: 0.2382\n",
      "Eval:\n",
      "Hits@1: 0.3613, Hits@3: 0.4181, Hits@10: 0.4727, MRR: 0.3969\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -1.4614, rewards: 0.2485\n",
      "Iteration: 60, Train loss: -1.5118, rewards: 0.2768\n",
      "Iteration: 65, Train loss: -1.5741, rewards: 0.2724\n",
      "Iteration: 70, Train loss: -1.5219, rewards: 0.2693\n",
      "Iteration: 75, Train loss: -1.4486, rewards: 0.2790\n",
      "Iteration: 80, Train loss: -1.5318, rewards: 0.2609\n",
      "Iteration: 85, Train loss: -1.4937, rewards: 0.2933\n",
      "Iteration: 90, Train loss: -1.5287, rewards: 0.2516\n",
      "Iteration: 95, Train loss: -1.5433, rewards: 0.3143\n",
      "Iteration: 100, Train loss: -1.5730, rewards: 0.2774\n",
      "Eval:\n",
      "Hits@1: 0.3908, Hits@3: 0.4223, Hits@10: 0.4517, MRR: 0.4101\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -1.5568, rewards: 0.3287\n",
      "Iteration: 110, Train loss: -1.5690, rewards: 0.2975\n",
      "Iteration: 115, Train loss: -1.4655, rewards: 0.3372\n",
      "Iteration: 120, Train loss: -1.5357, rewards: 0.2940\n",
      "Iteration: 125, Train loss: -1.5719, rewards: 0.3428\n",
      "Iteration: 130, Train loss: -1.5394, rewards: 0.2947\n",
      "Iteration: 135, Train loss: -1.5195, rewards: 0.3256\n",
      "Iteration: 140, Train loss: -1.5216, rewards: 0.3174\n",
      "Iteration: 145, Train loss: -1.5434, rewards: 0.3240\n",
      "Iteration: 150, Train loss: -1.5455, rewards: 0.2970\n",
      "Eval:\n",
      "Hits@1: 0.4013, Hits@3: 0.4265, Hits@10: 0.4496, MRR: 0.4170\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -1.5492, rewards: 0.3161\n",
      "Iteration: 160, Train loss: -1.5821, rewards: 0.3160\n",
      "Iteration: 165, Train loss: -1.5860, rewards: 0.3080\n",
      "Iteration: 170, Train loss: -1.5393, rewards: 0.3314\n",
      "Iteration: 175, Train loss: -1.5191, rewards: 0.3275\n",
      "Iteration: 180, Train loss: -1.5640, rewards: 0.2793\n",
      "Iteration: 185, Train loss: -1.5131, rewards: 0.3846\n",
      "Iteration: 190, Train loss: -1.5893, rewards: 0.3219\n",
      "Iteration: 195, Train loss: -1.5312, rewards: 0.3128\n",
      "Iteration: 200, Train loss: -1.4976, rewards: 0.3543\n",
      "Eval:\n",
      "Hits@1: 0.4076, Hits@3: 0.4328, Hits@10: 0.4601, MRR: 0.4233\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -1.5525, rewards: 0.3343\n",
      "Iteration: 210, Train loss: -1.5029, rewards: 0.3446\n",
      "Iteration: 215, Train loss: -1.4973, rewards: 0.3325\n",
      "Iteration: 220, Train loss: -1.5518, rewards: 0.3041\n",
      "Iteration: 225, Train loss: -1.6056, rewards: 0.3506\n",
      "Iteration: 230, Train loss: -1.5389, rewards: 0.3776\n",
      "Iteration: 235, Train loss: -1.4609, rewards: 0.3085\n",
      "Iteration: 240, Train loss: -1.4940, rewards: 0.3398\n",
      "Iteration: 245, Train loss: -1.4966, rewards: 0.3654\n",
      "Iteration: 250, Train loss: -1.5767, rewards: 0.3416\n",
      "Eval:\n",
      "Hits@1: 0.4013, Hits@3: 0.4391, Hits@10: 0.4622, MRR: 0.4230\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -1.5285, rewards: 0.3149\n",
      "Iteration: 260, Train loss: -1.5697, rewards: 0.3587\n",
      "Iteration: 265, Train loss: -1.5683, rewards: 0.3287\n",
      "Iteration: 270, Train loss: -1.5846, rewards: 0.3275\n",
      "Iteration: 275, Train loss: -1.6101, rewards: 0.3470\n",
      "Iteration: 280, Train loss: -1.5297, rewards: 0.3346\n",
      "Iteration: 285, Train loss: -1.5849, rewards: 0.3432\n",
      "Iteration: 290, Train loss: -1.5179, rewards: 0.3175\n",
      "Iteration: 295, Train loss: -1.6198, rewards: 0.3295\n",
      "Iteration: 300, Train loss: -1.5646, rewards: 0.3462\n",
      "Eval:\n",
      "Hits@1: 0.3971, Hits@3: 0.4286, Hits@10: 0.4580, MRR: 0.4153\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -1.5409, rewards: 0.3289\n",
      "Iteration: 310, Train loss: -1.4980, rewards: 0.3303\n",
      "Iteration: 315, Train loss: -1.5544, rewards: 0.3396\n",
      "Iteration: 320, Train loss: -1.4601, rewards: 0.3159\n",
      "Iteration: 325, Train loss: -1.5634, rewards: 0.3433\n",
      "Iteration: 330, Train loss: -1.5744, rewards: 0.3409\n",
      "Iteration: 335, Train loss: -1.5355, rewards: 0.3602\n",
      "Iteration: 340, Train loss: -1.5588, rewards: 0.3238\n",
      "Iteration: 345, Train loss: -1.5566, rewards: 0.3108\n",
      "Iteration: 350, Train loss: -1.5353, rewards: 0.3141\n",
      "Eval:\n",
      "Hits@1: 0.4055, Hits@3: 0.4391, Hits@10: 0.4601, MRR: 0.4233\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -1.5691, rewards: 0.3530\n",
      "Iteration: 360, Train loss: -1.5665, rewards: 0.3264\n",
      "Iteration: 365, Train loss: -1.5508, rewards: 0.3846\n",
      "Iteration: 370, Train loss: -1.5622, rewards: 0.3447\n",
      "Iteration: 375, Train loss: -1.5453, rewards: 0.3610\n",
      "Iteration: 380, Train loss: -1.5732, rewards: 0.3327\n",
      "Iteration: 385, Train loss: -1.5917, rewards: 0.3431\n",
      "Iteration: 390, Train loss: -1.5055, rewards: 0.3267\n",
      "Iteration: 395, Train loss: -1.5474, rewards: 0.3385\n",
      "Iteration: 400, Train loss: -1.5404, rewards: 0.3528\n",
      "Eval:\n",
      "Hits@1: 0.4244, Hits@3: 0.4370, Hits@10: 0.4601, MRR: 0.4341\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -1.5628, rewards: 0.3558\n",
      "Iteration: 410, Train loss: -1.5402, rewards: 0.3328\n",
      "Iteration: 415, Train loss: -1.5496, rewards: 0.3533\n",
      "Iteration: 420, Train loss: -1.5340, rewards: 0.3577\n",
      "Iteration: 425, Train loss: -1.5162, rewards: 0.3390\n",
      "Iteration: 430, Train loss: -1.5474, rewards: 0.3608\n",
      "Iteration: 435, Train loss: -1.5759, rewards: 0.3615\n",
      "Iteration: 440, Train loss: -1.5480, rewards: 0.3574\n",
      "Iteration: 445, Train loss: -1.5583, rewards: 0.3354\n",
      "Iteration: 450, Train loss: -1.5286, rewards: 0.3490\n",
      "Eval:\n",
      "Hits@1: 0.4013, Hits@3: 0.4328, Hits@10: 0.4538, MRR: 0.4187\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -1.5012, rewards: 0.3632\n",
      "Iteration: 460, Train loss: -1.5065, rewards: 0.3691\n",
      "Iteration: 465, Train loss: -1.5254, rewards: 0.3293\n",
      "Iteration: 470, Train loss: -1.5688, rewards: 0.3776\n",
      "Iteration: 475, Train loss: -1.5072, rewards: 0.3451\n",
      "Iteration: 480, Train loss: -1.5506, rewards: 0.3549\n",
      "Iteration: 485, Train loss: -1.5093, rewards: 0.3896\n",
      "Iteration: 490, Train loss: -1.5519, rewards: 0.3408\n",
      "Iteration: 495, Train loss: -1.5732, rewards: 0.3527\n",
      "Iteration: 500, Train loss: -1.6005, rewards: 0.4131\n",
      "Eval:\n",
      "Hits@1: 0.4034, Hits@3: 0.4328, Hits@10: 0.4538, MRR: 0.4191\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -1.5334, rewards: 0.3427\n",
      "Iteration: 510, Train loss: -1.5425, rewards: 0.3480\n",
      "Iteration: 515, Train loss: -1.6038, rewards: 0.3742\n",
      "Iteration: 520, Train loss: -1.5322, rewards: 0.3375\n",
      "Iteration: 525, Train loss: -1.5513, rewards: 0.3166\n",
      "Iteration: 530, Train loss: -1.5790, rewards: 0.3588\n",
      "Iteration: 535, Train loss: -1.5704, rewards: 0.3514\n",
      "Iteration: 540, Train loss: -1.5583, rewards: 0.3374\n",
      "Iteration: 545, Train loss: -1.5601, rewards: 0.3215\n",
      "Iteration: 550, Train loss: -1.5344, rewards: 0.3908\n",
      "Eval:\n",
      "Hits@1: 0.4181, Hits@3: 0.4349, Hits@10: 0.4601, MRR: 0.4296\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -1.5588, rewards: 0.3367\n",
      "Iteration: 560, Train loss: -1.5767, rewards: 0.3318\n",
      "Iteration: 565, Train loss: -1.5678, rewards: 0.3635\n",
      "Iteration: 570, Train loss: -1.5367, rewards: 0.3814\n",
      "Iteration: 575, Train loss: -1.5519, rewards: 0.3807\n",
      "Iteration: 580, Train loss: -1.5522, rewards: 0.3572\n",
      "Iteration: 585, Train loss: -1.5642, rewards: 0.3549\n",
      "Iteration: 590, Train loss: -1.5625, rewards: 0.3498\n",
      "Iteration: 595, Train loss: -1.6092, rewards: 0.3798\n",
      "Iteration: 600, Train loss: -1.5050, rewards: 0.3339\n",
      "Eval:\n",
      "Hits@1: 0.3782, Hits@3: 0.3950, Hits@10: 0.4328, MRR: 0.3921\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -1.5479, rewards: 0.3839\n",
      "Iteration: 610, Train loss: -1.5350, rewards: 0.3573\n",
      "Iteration: 615, Train loss: -1.5531, rewards: 0.3448\n",
      "Iteration: 620, Train loss: -1.5321, rewards: 0.3499\n",
      "Iteration: 625, Train loss: -1.5334, rewards: 0.3597\n",
      "Iteration: 630, Train loss: -1.5596, rewards: 0.3619\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 635, Train loss: -1.5860, rewards: 0.3642\n",
      "Iteration: 640, Train loss: -1.5662, rewards: 0.3614\n",
      "Iteration: 645, Train loss: -1.5436, rewards: 0.3411\n",
      "Iteration: 650, Train loss: -1.4959, rewards: 0.3694\n",
      "Eval:\n",
      "Hits@1: 0.4202, Hits@3: 0.4433, Hits@10: 0.4622, MRR: 0.4347\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -1.5140, rewards: 0.3674\n",
      "Iteration: 660, Train loss: -1.4341, rewards: 0.3600\n",
      "Iteration: 665, Train loss: -1.4543, rewards: 0.3728\n",
      "Iteration: 670, Train loss: -1.5850, rewards: 0.3573\n",
      "Iteration: 675, Train loss: -1.5442, rewards: 0.3421\n",
      "Iteration: 680, Train loss: -1.5305, rewards: 0.3732\n",
      "Iteration: 685, Train loss: -1.5902, rewards: 0.3466\n",
      "Iteration: 690, Train loss: -1.4655, rewards: 0.3570\n",
      "Iteration: 695, Train loss: -1.5106, rewards: 0.3621\n",
      "Iteration: 700, Train loss: -1.6060, rewards: 0.3576\n",
      "Eval:\n",
      "Hits@1: 0.4055, Hits@3: 0.4307, Hits@10: 0.4538, MRR: 0.4205\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -1.5223, rewards: 0.3482\n",
      "Iteration: 710, Train loss: -1.5120, rewards: 0.3741\n",
      "Iteration: 715, Train loss: -1.5714, rewards: 0.3526\n",
      "Iteration: 720, Train loss: -1.5254, rewards: 0.3588\n",
      "Iteration: 725, Train loss: -1.6030, rewards: 0.3523\n",
      "Iteration: 730, Train loss: -1.5358, rewards: 0.3557\n",
      "Iteration: 735, Train loss: -1.4977, rewards: 0.4140\n",
      "Iteration: 740, Train loss: -1.5088, rewards: 0.3469\n",
      "Iteration: 745, Train loss: -1.4644, rewards: 0.3503\n",
      "Iteration: 750, Train loss: -1.4892, rewards: 0.3923\n",
      "Eval:\n",
      "Hits@1: 0.3761, Hits@3: 0.3908, Hits@10: 0.4328, MRR: 0.3905\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -1.5036, rewards: 0.3414\n",
      "Iteration: 760, Train loss: -1.5287, rewards: 0.3694\n",
      "Iteration: 765, Train loss: -1.5504, rewards: 0.3614\n",
      "Iteration: 770, Train loss: -1.5800, rewards: 0.3815\n",
      "Iteration: 775, Train loss: -1.5712, rewards: 0.3261\n",
      "Iteration: 780, Train loss: -1.4885, rewards: 0.3592\n",
      "Iteration: 785, Train loss: -1.5870, rewards: 0.3522\n",
      "Iteration: 790, Train loss: -1.5471, rewards: 0.3349\n",
      "Iteration: 795, Train loss: -1.5647, rewards: 0.3685\n",
      "Iteration: 800, Train loss: -1.5401, rewards: 0.3263\n",
      "Eval:\n",
      "Hits@1: 0.3992, Hits@3: 0.4223, Hits@10: 0.4454, MRR: 0.4134\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -1.5395, rewards: 0.3916\n",
      "Iteration: 810, Train loss: -1.5861, rewards: 0.3842\n",
      "Iteration: 815, Train loss: -1.5901, rewards: 0.3393\n",
      "Iteration: 820, Train loss: -1.5458, rewards: 0.3875\n",
      "Iteration: 825, Train loss: -1.5607, rewards: 0.3332\n",
      "Iteration: 830, Train loss: -1.6049, rewards: 0.3846\n",
      "Iteration: 835, Train loss: -1.5208, rewards: 0.3764\n",
      "Iteration: 840, Train loss: -1.6205, rewards: 0.3775\n",
      "Iteration: 845, Train loss: -1.5762, rewards: 0.3559\n",
      "Iteration: 850, Train loss: -1.6289, rewards: 0.3384\n",
      "Eval:\n",
      "Hits@1: 0.3782, Hits@3: 0.3950, Hits@10: 0.4328, MRR: 0.3921\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -1.5644, rewards: 0.3568\n",
      "Iteration: 860, Train loss: -1.5393, rewards: 0.3419\n",
      "Iteration: 865, Train loss: -1.5684, rewards: 0.3692\n",
      "Iteration: 870, Train loss: -1.5554, rewards: 0.3681\n",
      "Iteration: 875, Train loss: -1.5667, rewards: 0.3596\n",
      "Iteration: 880, Train loss: -1.5973, rewards: 0.3657\n",
      "Iteration: 885, Train loss: -1.5628, rewards: 0.3410\n",
      "Iteration: 890, Train loss: -1.5208, rewards: 0.3618\n",
      "Iteration: 895, Train loss: -1.5225, rewards: 0.4022\n",
      "Iteration: 900, Train loss: -1.5465, rewards: 0.3868\n",
      "Eval:\n",
      "Hits@1: 0.4034, Hits@3: 0.4181, Hits@10: 0.4475, MRR: 0.4153\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -1.5971, rewards: 0.3894\n",
      "Iteration: 910, Train loss: -1.5657, rewards: 0.3751\n",
      "Iteration: 915, Train loss: -1.5726, rewards: 0.3504\n",
      "Iteration: 920, Train loss: -1.5750, rewards: 0.3775\n",
      "Iteration: 925, Train loss: -1.5548, rewards: 0.3818\n",
      "Iteration: 930, Train loss: -1.5631, rewards: 0.3528\n",
      "Iteration: 935, Train loss: -1.6017, rewards: 0.3768\n",
      "Iteration: 940, Train loss: -1.5336, rewards: 0.3367\n",
      "Iteration: 945, Train loss: -1.5225, rewards: 0.4135\n",
      "Iteration: 950, Train loss: -1.5571, rewards: 0.3757\n",
      "Eval:\n",
      "Hits@1: 0.3971, Hits@3: 0.4160, Hits@10: 0.4496, MRR: 0.4110\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -1.5429, rewards: 0.3476\n",
      "Iteration: 960, Train loss: -1.6370, rewards: 0.3574\n",
      "Iteration: 965, Train loss: -1.4702, rewards: 0.3810\n",
      "Iteration: 970, Train loss: -1.5827, rewards: 0.3401\n",
      "Iteration: 975, Train loss: -1.5850, rewards: 0.3890\n",
      "Iteration: 980, Train loss: -1.6313, rewards: 0.3818\n",
      "Iteration: 985, Train loss: -1.5364, rewards: 0.3612\n",
      "Iteration: 990, Train loss: -1.5539, rewards: 0.3796\n",
      "Iteration: 995, Train loss: -1.5928, rewards: 0.3714\n",
      "Iteration: 1000, Train loss: -1.5839, rewards: 0.3646\n",
      "Eval:\n",
      "Hits@1: 0.3803, Hits@3: 0.3929, Hits@10: 0.4286, MRR: 0.3915\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -1.5985, rewards: 0.3679\n",
      "Iteration: 1010, Train loss: -1.5971, rewards: 0.3293\n",
      "Iteration: 1015, Train loss: -1.5302, rewards: 0.3623\n",
      "Iteration: 1020, Train loss: -1.5570, rewards: 0.3503\n",
      "Iteration: 1025, Train loss: -1.5129, rewards: 0.3734\n",
      "Iteration: 1030, Train loss: -1.5492, rewards: 0.3445\n",
      "Iteration: 1035, Train loss: -1.5265, rewards: 0.3798\n",
      "Iteration: 1040, Train loss: -1.5073, rewards: 0.3703\n",
      "Iteration: 1045, Train loss: -1.5600, rewards: 0.3575\n",
      "Iteration: 1050, Train loss: -1.6228, rewards: 0.3786\n",
      "Eval:\n",
      "Hits@1: 0.4076, Hits@3: 0.4286, Hits@10: 0.4496, MRR: 0.4199\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -1.5466, rewards: 0.3880\n",
      "Iteration: 1060, Train loss: -1.5456, rewards: 0.3666\n",
      "Iteration: 1065, Train loss: -1.5745, rewards: 0.3539\n",
      "Iteration: 1070, Train loss: -1.5631, rewards: 0.3736\n",
      "Iteration: 1075, Train loss: -1.5633, rewards: 0.3733\n",
      "Iteration: 1080, Train loss: -1.5011, rewards: 0.3540\n",
      "Iteration: 1085, Train loss: -1.5758, rewards: 0.3855\n",
      "Iteration: 1090, Train loss: -1.5586, rewards: 0.3661\n",
      "Iteration: 1095, Train loss: -1.5456, rewards: 0.3629\n",
      "Iteration: 1100, Train loss: -1.4876, rewards: 0.3728\n",
      "Eval:\n",
      "Hits@1: 0.3613, Hits@3: 0.3739, Hits@10: 0.4097, MRR: 0.3735\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -1.5784, rewards: 0.4046\n",
      "Iteration: 1110, Train loss: -1.6235, rewards: 0.3518\n",
      "Iteration: 1115, Train loss: -1.5515, rewards: 0.3478\n",
      "Iteration: 1120, Train loss: -1.5763, rewards: 0.3672\n",
      "Iteration: 1125, Train loss: -1.5317, rewards: 0.3748\n",
      "Iteration: 1130, Train loss: -1.5773, rewards: 0.3778\n",
      "Iteration: 1135, Train loss: -1.5413, rewards: 0.3769\n",
      "Iteration: 1140, Train loss: -1.5598, rewards: 0.3667\n",
      "Iteration: 1145, Train loss: -1.4725, rewards: 0.3720\n",
      "Iteration: 1150, Train loss: -1.5290, rewards: 0.3651\n",
      "Eval:\n",
      "Hits@1: 0.3887, Hits@3: 0.4118, Hits@10: 0.4412, MRR: 0.4031\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -1.5145, rewards: 0.3716\n",
      "Iteration: 1160, Train loss: -1.4818, rewards: 0.3858\n",
      "Iteration: 1165, Train loss: -1.4864, rewards: 0.3557\n",
      "Iteration: 1170, Train loss: -1.5262, rewards: 0.3579\n",
      "Iteration: 1175, Train loss: -1.5435, rewards: 0.3635\n",
      "Iteration: 1180, Train loss: -1.5733, rewards: 0.3753\n",
      "Iteration: 1185, Train loss: -1.5519, rewards: 0.3409\n",
      "Iteration: 1190, Train loss: -1.5276, rewards: 0.3972\n",
      "Iteration: 1195, Train loss: -1.5422, rewards: 0.3377\n",
      "Iteration: 1200, Train loss: -1.5347, rewards: 0.3472\n",
      "Eval:\n",
      "Hits@1: 0.3803, Hits@3: 0.3950, Hits@10: 0.4433, MRR: 0.3956\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -1.6363, rewards: 0.3601\n",
      "Iteration: 1210, Train loss: -1.4870, rewards: 0.3957\n",
      "Iteration: 1215, Train loss: -1.5507, rewards: 0.3653\n",
      "Iteration: 1220, Train loss: -1.5854, rewards: 0.3823\n",
      "Iteration: 1225, Train loss: -1.5911, rewards: 0.3637\n",
      "Iteration: 1230, Train loss: -1.5392, rewards: 0.4164\n",
      "Iteration: 1235, Train loss: -1.6002, rewards: 0.3895\n",
      "Iteration: 1240, Train loss: -1.5469, rewards: 0.3886\n",
      "Iteration: 1245, Train loss: -1.5853, rewards: 0.3819\n",
      "Iteration: 1250, Train loss: -1.4987, rewards: 0.4047\n",
      "Eval:\n",
      "Hits@1: 0.3634, Hits@3: 0.3845, Hits@10: 0.4307, MRR: 0.3796\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -1.5841, rewards: 0.3375\n",
      "Iteration: 1260, Train loss: -1.5195, rewards: 0.3829\n",
      "Iteration: 1265, Train loss: -1.5299, rewards: 0.3626\n",
      "Iteration: 1270, Train loss: -1.5653, rewards: 0.3855\n",
      "Iteration: 1275, Train loss: -1.6035, rewards: 0.3763\n",
      "Iteration: 1280, Train loss: -1.5091, rewards: 0.3363\n",
      "Iteration: 1285, Train loss: -1.5683, rewards: 0.3793\n",
      "Iteration: 1290, Train loss: -1.5806, rewards: 0.3790\n",
      "Iteration: 1295, Train loss: -1.5360, rewards: 0.3644\n",
      "Iteration: 1300, Train loss: -1.5632, rewards: 0.3440\n",
      "Eval:\n",
      "Hits@1: 0.3277, Hits@3: 0.3403, Hits@10: 0.3634, MRR: 0.3380\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -1.5431, rewards: 0.4163\n",
      "Iteration: 1310, Train loss: -1.5633, rewards: 0.3543\n",
      "Iteration: 1315, Train loss: -1.5415, rewards: 0.3824\n",
      "Iteration: 1320, Train loss: -1.5174, rewards: 0.3256\n",
      "Iteration: 1325, Train loss: -1.5808, rewards: 0.3655\n",
      "Iteration: 1330, Train loss: -1.5969, rewards: 0.3380\n",
      "Iteration: 1335, Train loss: -1.5650, rewards: 0.3544\n",
      "Iteration: 1340, Train loss: -1.5376, rewards: 0.3872\n",
      "Iteration: 1345, Train loss: -1.5877, rewards: 0.3422\n",
      "Iteration: 1350, Train loss: -1.5410, rewards: 0.3487\n",
      "Eval:\n",
      "Hits@1: 0.3887, Hits@3: 0.4160, Hits@10: 0.4475, MRR: 0.4064\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -1.5769, rewards: 0.4069\n",
      "Iteration: 1360, Train loss: -1.5902, rewards: 0.3657\n",
      "Iteration: 1365, Train loss: -1.5448, rewards: 0.3756\n",
      "Iteration: 1370, Train loss: -1.5639, rewards: 0.3882\n",
      "Iteration: 1375, Train loss: -1.5828, rewards: 0.3712\n",
      "Iteration: 1380, Train loss: -1.6294, rewards: 0.3445\n",
      "Iteration: 1385, Train loss: -1.5759, rewards: 0.4089\n",
      "Iteration: 1390, Train loss: -1.5900, rewards: 0.3613\n",
      "Iteration: 1395, Train loss: -1.5894, rewards: 0.3378\n",
      "Iteration: 1400, Train loss: -1.5663, rewards: 0.3981\n",
      "Eval:\n",
      "Hits@1: 0.3676, Hits@3: 0.3845, Hits@10: 0.4412, MRR: 0.3851\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -1.5388, rewards: 0.3766\n",
      "Iteration: 1410, Train loss: -1.4961, rewards: 0.3684\n",
      "Iteration: 1415, Train loss: -1.5730, rewards: 0.3819\n",
      "Iteration: 1420, Train loss: -1.5547, rewards: 0.3464\n",
      "Iteration: 1425, Train loss: -1.5386, rewards: 0.3597\n",
      "Iteration: 1430, Train loss: -1.5874, rewards: 0.3762\n",
      "Iteration: 1435, Train loss: -1.5632, rewards: 0.3469\n",
      "Iteration: 1440, Train loss: -1.5666, rewards: 0.4078\n",
      "Iteration: 1445, Train loss: -1.6155, rewards: 0.4297\n",
      "Iteration: 1450, Train loss: -1.5927, rewards: 0.3893\n",
      "Eval:\n",
      "Hits@1: 0.3550, Hits@3: 0.3634, Hits@10: 0.4139, MRR: 0.3685\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -1.5667, rewards: 0.3793\n",
      "Iteration: 1460, Train loss: -1.5297, rewards: 0.3800\n",
      "Iteration: 1465, Train loss: -1.5325, rewards: 0.3504\n",
      "Iteration: 1470, Train loss: -1.5902, rewards: 0.3973\n",
      "Iteration: 1475, Train loss: -1.5095, rewards: 0.3565\n",
      "Iteration: 1480, Train loss: -1.5437, rewards: 0.3626\n",
      "Iteration: 1485, Train loss: -1.5413, rewards: 0.3692\n",
      "Iteration: 1490, Train loss: -1.5734, rewards: 0.3939\n",
      "Iteration: 1495, Train loss: -1.5629, rewards: 0.3707\n",
      "Iteration: 1500, Train loss: -1.5554, rewards: 0.3738\n",
      "Eval:\n",
      "Hits@1: 0.3571, Hits@3: 0.3761, Hits@10: 0.4118, MRR: 0.3720\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -1.5777, rewards: 0.3582\n",
      "Iteration: 1510, Train loss: -1.5391, rewards: 0.3644\n",
      "Iteration: 1515, Train loss: -1.4803, rewards: 0.3896\n",
      "Iteration: 1520, Train loss: -1.5602, rewards: 0.3504\n",
      "Iteration: 1525, Train loss: -1.5541, rewards: 0.3778\n",
      "Iteration: 1530, Train loss: -1.5706, rewards: 0.3763\n",
      "Iteration: 1535, Train loss: -1.6045, rewards: 0.4132\n",
      "Iteration: 1540, Train loss: -1.5960, rewards: 0.3789\n",
      "Iteration: 1545, Train loss: -1.5955, rewards: 0.3830\n",
      "Iteration: 1550, Train loss: -1.5119, rewards: 0.3929\n",
      "Eval:\n",
      "Hits@1: 0.3845, Hits@3: 0.4118, Hits@10: 0.4517, MRR: 0.4039\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -1.6015, rewards: 0.3648\n",
      "Iteration: 1560, Train loss: -1.5703, rewards: 0.3543\n",
      "Iteration: 1565, Train loss: -1.4586, rewards: 0.3962\n",
      "Iteration: 1570, Train loss: -1.5856, rewards: 0.3774\n",
      "Iteration: 1575, Train loss: -1.5522, rewards: 0.3807\n",
      "Iteration: 1580, Train loss: -1.5922, rewards: 0.3480\n",
      "Iteration: 1585, Train loss: -1.5493, rewards: 0.3777\n",
      "Iteration: 1590, Train loss: -1.5250, rewards: 0.3655\n",
      "Iteration: 1595, Train loss: -1.5341, rewards: 0.3576\n",
      "Iteration: 1600, Train loss: -1.5736, rewards: 0.3835\n",
      "Eval:\n",
      "Hits@1: 0.3887, Hits@3: 0.4097, Hits@10: 0.4475, MRR: 0.4044\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -1.4847, rewards: 0.3648\n",
      "Iteration: 1610, Train loss: -1.5577, rewards: 0.3695\n",
      "Iteration: 1615, Train loss: -1.5261, rewards: 0.3754\n",
      "Iteration: 1620, Train loss: -1.5716, rewards: 0.3598\n",
      "Iteration: 1625, Train loss: -1.5878, rewards: 0.3735\n",
      "Iteration: 1630, Train loss: -1.5565, rewards: 0.3402\n",
      "Iteration: 1635, Train loss: -1.5302, rewards: 0.3806\n",
      "Iteration: 1640, Train loss: -1.5667, rewards: 0.3980\n",
      "Iteration: 1645, Train loss: -1.5370, rewards: 0.4022\n",
      "Iteration: 1650, Train loss: -1.5991, rewards: 0.3600\n",
      "Eval:\n",
      "Hits@1: 0.3887, Hits@3: 0.4160, Hits@10: 0.4559, MRR: 0.4064\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -1.5305, rewards: 0.3718\n",
      "Iteration: 1660, Train loss: -1.5717, rewards: 0.3636\n",
      "Iteration: 1665, Train loss: -1.6072, rewards: 0.3839\n",
      "Iteration: 1670, Train loss: -1.5260, rewards: 0.3837\n",
      "Iteration: 1675, Train loss: -1.5619, rewards: 0.3476\n",
      "Iteration: 1680, Train loss: -1.5744, rewards: 0.4022\n",
      "Iteration: 1685, Train loss: -1.5407, rewards: 0.3441\n",
      "Iteration: 1690, Train loss: -1.6336, rewards: 0.3711\n",
      "Iteration: 1695, Train loss: -1.4683, rewards: 0.3810\n",
      "Iteration: 1700, Train loss: -1.5621, rewards: 0.4093\n",
      "Eval:\n",
      "Hits@1: 0.3887, Hits@3: 0.3971, Hits@10: 0.4349, MRR: 0.3989\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -1.5700, rewards: 0.3541\n",
      "Iteration: 1710, Train loss: -1.4975, rewards: 0.3948\n",
      "Iteration: 1715, Train loss: -1.5299, rewards: 0.3285\n",
      "Iteration: 1720, Train loss: -1.6205, rewards: 0.3962\n",
      "Iteration: 1725, Train loss: -1.5729, rewards: 0.3957\n",
      "Iteration: 1730, Train loss: -1.5249, rewards: 0.3746\n",
      "Iteration: 1735, Train loss: -1.5667, rewards: 0.3765\n",
      "Iteration: 1740, Train loss: -1.5906, rewards: 0.4090\n",
      "Iteration: 1745, Train loss: -1.5479, rewards: 0.3613\n",
      "Iteration: 1750, Train loss: -1.5840, rewards: 0.3790\n",
      "Eval:\n",
      "Hits@1: 0.3655, Hits@3: 0.3739, Hits@10: 0.4265, MRR: 0.3785\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -1.5989, rewards: 0.3480\n",
      "Iteration: 1760, Train loss: -1.5693, rewards: 0.3978\n",
      "Iteration: 1765, Train loss: -1.6071, rewards: 0.3667\n",
      "Iteration: 1770, Train loss: -1.5516, rewards: 0.3843\n",
      "Iteration: 1775, Train loss: -1.5507, rewards: 0.3844\n",
      "Iteration: 1780, Train loss: -1.5782, rewards: 0.3706\n",
      "Iteration: 1785, Train loss: -1.5725, rewards: 0.3878\n",
      "Iteration: 1790, Train loss: -1.5170, rewards: 0.3130\n",
      "Iteration: 1795, Train loss: -1.5916, rewards: 0.3489\n",
      "Iteration: 1800, Train loss: -1.5484, rewards: 0.3901\n",
      "Eval:\n",
      "Hits@1: 0.3445, Hits@3: 0.3550, Hits@10: 0.3950, MRR: 0.3565\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -1.6030, rewards: 0.3643\n",
      "Iteration: 1810, Train loss: -1.5835, rewards: 0.3488\n",
      "Iteration: 1815, Train loss: -1.5128, rewards: 0.3737\n",
      "Iteration: 1820, Train loss: -1.5668, rewards: 0.3558\n",
      "Iteration: 1825, Train loss: -1.5694, rewards: 0.3667\n",
      "Iteration: 1830, Train loss: -1.5491, rewards: 0.3626\n",
      "Iteration: 1835, Train loss: -1.5940, rewards: 0.4042\n",
      "Iteration: 1840, Train loss: -1.5311, rewards: 0.3937\n",
      "Iteration: 1845, Train loss: -1.5330, rewards: 0.3576\n",
      "Iteration: 1850, Train loss: -1.5313, rewards: 0.3780\n",
      "Eval:\n",
      "Hits@1: 0.3634, Hits@3: 0.3824, Hits@10: 0.4223, MRR: 0.3801\n",
      "------------------------------------------------------------\n",
      "Iteration: 1855, Train loss: -1.5508, rewards: 0.4135\n",
      "Iteration: 1860, Train loss: -1.5645, rewards: 0.3510\n",
      "Iteration: 1865, Train loss: -1.4890, rewards: 0.3760\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1870, Train loss: -1.5945, rewards: 0.3668\n",
      "Iteration: 1875, Train loss: -1.6347, rewards: 0.4094\n",
      "Iteration: 1880, Train loss: -1.5602, rewards: 0.3942\n",
      "Iteration: 1885, Train loss: -1.5435, rewards: 0.3749\n",
      "Iteration: 1890, Train loss: -1.4913, rewards: 0.3758\n",
      "Iteration: 1895, Train loss: -1.5204, rewards: 0.3884\n",
      "Iteration: 1900, Train loss: -1.6010, rewards: 0.3515\n",
      "Eval:\n",
      "Hits@1: 0.3929, Hits@3: 0.4055, Hits@10: 0.4475, MRR: 0.4052\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -1.5570, rewards: 0.3667\n",
      "Iteration: 1910, Train loss: -1.5372, rewards: 0.3647\n",
      "Iteration: 1915, Train loss: -1.6173, rewards: 0.3433\n",
      "Iteration: 1920, Train loss: -1.5699, rewards: 0.3776\n",
      "Iteration: 1925, Train loss: -1.5705, rewards: 0.3580\n",
      "Iteration: 1930, Train loss: -1.5794, rewards: 0.3671\n",
      "Iteration: 1935, Train loss: -1.4912, rewards: 0.3913\n",
      "Iteration: 1940, Train loss: -1.5658, rewards: 0.3590\n",
      "Iteration: 1945, Train loss: -1.6120, rewards: 0.3824\n",
      "Iteration: 1950, Train loss: -1.4993, rewards: 0.3539\n",
      "Eval:\n",
      "Hits@1: 0.3529, Hits@3: 0.3803, Hits@10: 0.4265, MRR: 0.3742\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -1.5984, rewards: 0.3992\n",
      "Iteration: 1960, Train loss: -1.5339, rewards: 0.3733\n",
      "Iteration: 1965, Train loss: -1.4762, rewards: 0.4227\n",
      "Iteration: 1970, Train loss: -1.5319, rewards: 0.4012\n",
      "Iteration: 1975, Train loss: -1.5236, rewards: 0.3561\n",
      "Iteration: 1980, Train loss: -1.5750, rewards: 0.3909\n",
      "Iteration: 1985, Train loss: -1.5798, rewards: 0.3899\n",
      "Iteration: 1990, Train loss: -1.5750, rewards: 0.3889\n",
      "Iteration: 1995, Train loss: -1.5368, rewards: 0.3660\n",
      "Iteration: 2000, Train loss: -1.5561, rewards: 0.4016\n",
      "Eval:\n",
      "Hits@1: 0.4160, Hits@3: 0.4349, Hits@10: 0.4601, MRR: 0.4279\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/organizationhiredperson//test_beam/ ]\n",
      "Hits@1: 0.4959, Hits@3: 0.5864, Hits@10: 0.6379, MRR: 0.5464\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.8742671135530456 (349 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-29 21:48:11,846]\u001b[0m Trial 0 finished with value: 0.8742671135530456 and parameters: {'lr': 0.0006368906270844632, 'bs': 97, 'b': 0.4072149665331217, 'l': 0.01829587007748107, 'ee': 50}. Best is trial 0 with value: 0.8742671135530456.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.6800, rewards: 0.1062\n",
      "Iteration: 10, Train loss: -0.7012, rewards: 0.1346\n",
      "Iteration: 15, Train loss: -0.7961, rewards: 0.1246\n",
      "Iteration: 20, Train loss: -0.8673, rewards: 0.2183\n",
      "Iteration: 25, Train loss: -0.8735, rewards: 0.1700\n",
      "Iteration: 30, Train loss: -0.7766, rewards: 0.1971\n",
      "Iteration: 35, Train loss: -0.9395, rewards: 0.2075\n",
      "Iteration: 40, Train loss: -0.9124, rewards: 0.2358\n",
      "Iteration: 45, Train loss: -0.8856, rewards: 0.1879\n",
      "Iteration: 50, Train loss: -0.8484, rewards: 0.2467\n",
      "Eval:\n",
      "Hits@1: 0.3845, Hits@3: 0.4517, Hits@10: 0.4811, MRR: 0.4201\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.8435, rewards: 0.2387\n",
      "Iteration: 60, Train loss: -0.8342, rewards: 0.2554\n",
      "Iteration: 65, Train loss: -0.8244, rewards: 0.2787\n",
      "Iteration: 70, Train loss: -0.9108, rewards: 0.2450\n",
      "Iteration: 75, Train loss: -0.8746, rewards: 0.2717\n",
      "Iteration: 80, Train loss: -0.9403, rewards: 0.2996\n",
      "Iteration: 85, Train loss: -0.9198, rewards: 0.3275\n",
      "Iteration: 90, Train loss: -0.8963, rewards: 0.3254\n",
      "Iteration: 95, Train loss: -0.9225, rewards: 0.2817\n",
      "Iteration: 100, Train loss: -0.9077, rewards: 0.2646\n",
      "Eval:\n",
      "Hits@1: 0.4055, Hits@3: 0.4517, Hits@10: 0.4727, MRR: 0.4304\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.7858, rewards: 0.3317\n",
      "Iteration: 110, Train loss: -0.9118, rewards: 0.3558\n",
      "Iteration: 115, Train loss: -0.9429, rewards: 0.3746\n",
      "Iteration: 120, Train loss: -0.8842, rewards: 0.3333\n",
      "Iteration: 125, Train loss: -0.9806, rewards: 0.3483\n",
      "Iteration: 130, Train loss: -0.7697, rewards: 0.3246\n",
      "Iteration: 135, Train loss: -0.8028, rewards: 0.3454\n",
      "Iteration: 140, Train loss: -1.0096, rewards: 0.3117\n",
      "Iteration: 145, Train loss: -0.7921, rewards: 0.4000\n",
      "Iteration: 150, Train loss: -0.8434, rewards: 0.3329\n",
      "Eval:\n",
      "Hits@1: 0.4265, Hits@3: 0.4643, Hits@10: 0.4853, MRR: 0.4492\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.9221, rewards: 0.3146\n",
      "Iteration: 160, Train loss: -0.9048, rewards: 0.3688\n",
      "Iteration: 165, Train loss: -0.8707, rewards: 0.3525\n",
      "Iteration: 170, Train loss: -0.7789, rewards: 0.3321\n",
      "Iteration: 175, Train loss: -0.9215, rewards: 0.3983\n",
      "Iteration: 180, Train loss: -0.9302, rewards: 0.3671\n",
      "Iteration: 185, Train loss: -0.8743, rewards: 0.4008\n",
      "Iteration: 190, Train loss: -0.9084, rewards: 0.4171\n",
      "Iteration: 195, Train loss: -0.8753, rewards: 0.3992\n",
      "Iteration: 200, Train loss: -0.8061, rewards: 0.3821\n",
      "Eval:\n",
      "Hits@1: 0.4454, Hits@3: 0.4706, Hits@10: 0.4853, MRR: 0.4600\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.9205, rewards: 0.3958\n",
      "Iteration: 210, Train loss: -0.8634, rewards: 0.2925\n",
      "Iteration: 215, Train loss: -0.9645, rewards: 0.3967\n",
      "Iteration: 220, Train loss: -0.7618, rewards: 0.3629\n",
      "Iteration: 225, Train loss: -0.9024, rewards: 0.4113\n",
      "Iteration: 230, Train loss: -0.9342, rewards: 0.3079\n",
      "Iteration: 235, Train loss: -0.8198, rewards: 0.3942\n",
      "Iteration: 240, Train loss: -0.8686, rewards: 0.2929\n",
      "Iteration: 245, Train loss: -0.9499, rewards: 0.3858\n",
      "Iteration: 250, Train loss: -0.8747, rewards: 0.4358\n",
      "Eval:\n",
      "Hits@1: 0.4433, Hits@3: 0.4685, Hits@10: 0.4790, MRR: 0.4572\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.9143, rewards: 0.3621\n",
      "Iteration: 260, Train loss: -0.8871, rewards: 0.3563\n",
      "Iteration: 265, Train loss: -0.9475, rewards: 0.3262\n",
      "Iteration: 270, Train loss: -0.8801, rewards: 0.3337\n",
      "Iteration: 275, Train loss: -0.9331, rewards: 0.3417\n",
      "Iteration: 280, Train loss: -0.9292, rewards: 0.4275\n",
      "Iteration: 285, Train loss: -0.7532, rewards: 0.4321\n",
      "Iteration: 290, Train loss: -0.8109, rewards: 0.3317\n",
      "Iteration: 295, Train loss: -1.0148, rewards: 0.4108\n",
      "Iteration: 300, Train loss: -0.8862, rewards: 0.3979\n",
      "Eval:\n",
      "Hits@1: 0.4517, Hits@3: 0.4643, Hits@10: 0.4769, MRR: 0.4597\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.8499, rewards: 0.4317\n",
      "Iteration: 310, Train loss: -0.9098, rewards: 0.3700\n",
      "Iteration: 315, Train loss: -1.0098, rewards: 0.3842\n",
      "Iteration: 320, Train loss: -0.9531, rewards: 0.3975\n",
      "Iteration: 325, Train loss: -0.8771, rewards: 0.4004\n",
      "Iteration: 330, Train loss: -0.9128, rewards: 0.4121\n",
      "Iteration: 335, Train loss: -0.9954, rewards: 0.3329\n",
      "Iteration: 340, Train loss: -0.9569, rewards: 0.3254\n",
      "Iteration: 345, Train loss: -0.9449, rewards: 0.4392\n",
      "Iteration: 350, Train loss: -0.9780, rewards: 0.4296\n",
      "Eval:\n",
      "Hits@1: 0.4517, Hits@3: 0.4685, Hits@10: 0.4916, MRR: 0.4625\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -0.9742, rewards: 0.3771\n",
      "Iteration: 360, Train loss: -1.0031, rewards: 0.4404\n",
      "Iteration: 365, Train loss: -0.8454, rewards: 0.4417\n",
      "Iteration: 370, Train loss: -0.8159, rewards: 0.3046\n",
      "Iteration: 375, Train loss: -0.8703, rewards: 0.3450\n",
      "Iteration: 380, Train loss: -0.8856, rewards: 0.3492\n",
      "Iteration: 385, Train loss: -0.8913, rewards: 0.3571\n",
      "Iteration: 390, Train loss: -0.9005, rewards: 0.3929\n",
      "Iteration: 395, Train loss: -0.9407, rewards: 0.3729\n",
      "Iteration: 400, Train loss: -0.8617, rewards: 0.4004\n",
      "Eval:\n",
      "Hits@1: 0.4538, Hits@3: 0.4685, Hits@10: 0.4832, MRR: 0.4629\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -0.8319, rewards: 0.3879\n",
      "Iteration: 410, Train loss: -0.7917, rewards: 0.4446\n",
      "Iteration: 415, Train loss: -0.8538, rewards: 0.4817\n",
      "Iteration: 420, Train loss: -0.8508, rewards: 0.3387\n",
      "Iteration: 425, Train loss: -0.9511, rewards: 0.4267\n",
      "Iteration: 430, Train loss: -0.7854, rewards: 0.4929\n",
      "Iteration: 435, Train loss: -0.9783, rewards: 0.4221\n",
      "Iteration: 440, Train loss: -0.8899, rewards: 0.3812\n",
      "Iteration: 445, Train loss: -0.8057, rewards: 0.3421\n",
      "Iteration: 450, Train loss: -0.9815, rewards: 0.3925\n",
      "Eval:\n",
      "Hits@1: 0.4391, Hits@3: 0.4706, Hits@10: 0.4853, MRR: 0.4574\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -0.9479, rewards: 0.4142\n",
      "Iteration: 460, Train loss: -0.9611, rewards: 0.3417\n",
      "Iteration: 465, Train loss: -0.9118, rewards: 0.4254\n",
      "Iteration: 470, Train loss: -0.9945, rewards: 0.4229\n",
      "Iteration: 475, Train loss: -0.9178, rewards: 0.4771\n",
      "Iteration: 480, Train loss: -0.8306, rewards: 0.3013\n",
      "Iteration: 485, Train loss: -1.0982, rewards: 0.3567\n",
      "Iteration: 490, Train loss: -0.8686, rewards: 0.3758\n",
      "Iteration: 495, Train loss: -0.9507, rewards: 0.4542\n",
      "Iteration: 500, Train loss: -1.0489, rewards: 0.4275\n",
      "Eval:\n",
      "Hits@1: 0.4496, Hits@3: 0.4727, Hits@10: 0.4811, MRR: 0.4618\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -0.9084, rewards: 0.3933\n",
      "Iteration: 510, Train loss: -0.8074, rewards: 0.3433\n",
      "Iteration: 515, Train loss: -0.9970, rewards: 0.5308\n",
      "Iteration: 520, Train loss: -0.7983, rewards: 0.4571\n",
      "Iteration: 525, Train loss: -0.9358, rewards: 0.4358\n",
      "Iteration: 530, Train loss: -0.9775, rewards: 0.3779\n",
      "Iteration: 535, Train loss: -0.8608, rewards: 0.4758\n",
      "Iteration: 540, Train loss: -0.9387, rewards: 0.4625\n",
      "Iteration: 545, Train loss: -0.9516, rewards: 0.3400\n",
      "Iteration: 550, Train loss: -0.9667, rewards: 0.3212\n",
      "Eval:\n",
      "Hits@1: 0.4160, Hits@3: 0.4643, Hits@10: 0.4769, MRR: 0.4387\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -1.0144, rewards: 0.3508\n",
      "Iteration: 560, Train loss: -1.0032, rewards: 0.4146\n",
      "Iteration: 565, Train loss: -1.0696, rewards: 0.4879\n",
      "Iteration: 570, Train loss: -1.0072, rewards: 0.3679\n",
      "Iteration: 575, Train loss: -0.9917, rewards: 0.3550\n",
      "Iteration: 580, Train loss: -0.9894, rewards: 0.4158\n",
      "Iteration: 585, Train loss: -0.9705, rewards: 0.4225\n",
      "Iteration: 590, Train loss: -0.8894, rewards: 0.4371\n",
      "Iteration: 595, Train loss: -0.9368, rewards: 0.4396\n",
      "Iteration: 600, Train loss: -0.9445, rewards: 0.3779\n",
      "Eval:\n",
      "Hits@1: 0.4496, Hits@3: 0.4706, Hits@10: 0.4832, MRR: 0.4628\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -1.0034, rewards: 0.4079\n",
      "Iteration: 610, Train loss: -1.0022, rewards: 0.3758\n",
      "Iteration: 615, Train loss: -1.0240, rewards: 0.3483\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -0.9792, rewards: 0.4654\n",
      "Iteration: 625, Train loss: -0.9595, rewards: 0.4096\n",
      "Iteration: 630, Train loss: -0.9251, rewards: 0.4646\n",
      "Iteration: 635, Train loss: -1.0534, rewards: 0.4321\n",
      "Iteration: 640, Train loss: -1.0234, rewards: 0.4571\n",
      "Iteration: 645, Train loss: -0.9305, rewards: 0.4471\n",
      "Iteration: 650, Train loss: -0.9132, rewards: 0.2992\n",
      "Eval:\n",
      "Hits@1: 0.4391, Hits@3: 0.4664, Hits@10: 0.4790, MRR: 0.4557\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -1.0571, rewards: 0.3513\n",
      "Iteration: 660, Train loss: -0.9050, rewards: 0.3829\n",
      "Iteration: 665, Train loss: -0.9819, rewards: 0.5100\n",
      "Iteration: 670, Train loss: -0.9955, rewards: 0.3817\n",
      "Iteration: 675, Train loss: -1.0386, rewards: 0.3571\n",
      "Iteration: 680, Train loss: -0.8382, rewards: 0.4704\n",
      "Iteration: 685, Train loss: -0.9874, rewards: 0.3942\n",
      "Iteration: 690, Train loss: -1.0530, rewards: 0.4071\n",
      "Iteration: 695, Train loss: -1.0281, rewards: 0.4346\n",
      "Iteration: 700, Train loss: -0.8964, rewards: 0.4204\n",
      "Eval:\n",
      "Hits@1: 0.4517, Hits@3: 0.4643, Hits@10: 0.4769, MRR: 0.4595\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -0.8737, rewards: 0.4654\n",
      "Iteration: 710, Train loss: -1.1062, rewards: 0.3904\n",
      "Iteration: 715, Train loss: -1.0105, rewards: 0.4329\n",
      "Iteration: 720, Train loss: -1.0293, rewards: 0.4279\n",
      "Iteration: 725, Train loss: -1.0292, rewards: 0.3862\n",
      "Iteration: 730, Train loss: -0.9747, rewards: 0.4958\n",
      "Iteration: 735, Train loss: -1.1015, rewards: 0.5025\n",
      "Iteration: 740, Train loss: -0.8153, rewards: 0.3696\n",
      "Iteration: 745, Train loss: -1.1119, rewards: 0.4000\n",
      "Iteration: 750, Train loss: -1.0196, rewards: 0.3663\n",
      "Eval:\n",
      "Hits@1: 0.4349, Hits@3: 0.4559, Hits@10: 0.4769, MRR: 0.4489\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.9325, rewards: 0.3783\n",
      "Iteration: 760, Train loss: -1.0060, rewards: 0.4167\n",
      "Iteration: 765, Train loss: -1.1050, rewards: 0.3892\n",
      "Iteration: 770, Train loss: -1.0106, rewards: 0.3600\n",
      "Iteration: 775, Train loss: -1.1254, rewards: 0.3629\n",
      "Iteration: 780, Train loss: -0.8005, rewards: 0.4883\n",
      "Iteration: 785, Train loss: -1.0581, rewards: 0.4412\n",
      "Iteration: 790, Train loss: -1.0128, rewards: 0.4721\n",
      "Iteration: 795, Train loss: -0.9942, rewards: 0.3212\n",
      "Iteration: 800, Train loss: -1.0640, rewards: 0.3629\n",
      "Eval:\n",
      "Hits@1: 0.4097, Hits@3: 0.4706, Hits@10: 0.4790, MRR: 0.4387\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -1.0316, rewards: 0.4558\n",
      "Iteration: 810, Train loss: -1.1410, rewards: 0.4462\n",
      "Iteration: 815, Train loss: -0.9585, rewards: 0.4450\n",
      "Iteration: 820, Train loss: -0.9299, rewards: 0.4171\n",
      "Iteration: 825, Train loss: -1.0850, rewards: 0.3696\n",
      "Iteration: 830, Train loss: -1.0591, rewards: 0.4675\n",
      "Iteration: 835, Train loss: -1.1503, rewards: 0.4763\n",
      "Iteration: 840, Train loss: -1.0432, rewards: 0.3558\n",
      "Iteration: 845, Train loss: -1.0827, rewards: 0.4325\n",
      "Iteration: 850, Train loss: -1.1409, rewards: 0.4758\n",
      "Eval:\n",
      "Hits@1: 0.4328, Hits@3: 0.4643, Hits@10: 0.4790, MRR: 0.4502\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -1.1006, rewards: 0.4279\n",
      "Iteration: 860, Train loss: -1.0083, rewards: 0.3638\n",
      "Iteration: 865, Train loss: -1.1289, rewards: 0.4350\n",
      "Iteration: 870, Train loss: -0.9639, rewards: 0.3804\n",
      "Iteration: 875, Train loss: -1.0016, rewards: 0.4921\n",
      "Iteration: 880, Train loss: -0.9980, rewards: 0.4058\n",
      "Iteration: 885, Train loss: -1.0931, rewards: 0.4363\n",
      "Iteration: 890, Train loss: -1.0536, rewards: 0.4571\n",
      "Iteration: 895, Train loss: -1.0236, rewards: 0.4567\n",
      "Iteration: 900, Train loss: -0.9006, rewards: 0.4400\n",
      "Eval:\n",
      "Hits@1: 0.4307, Hits@3: 0.4559, Hits@10: 0.4769, MRR: 0.4461\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -1.0398, rewards: 0.3704\n",
      "Iteration: 910, Train loss: -1.1115, rewards: 0.4412\n",
      "Iteration: 915, Train loss: -1.0903, rewards: 0.4817\n",
      "Iteration: 920, Train loss: -1.2093, rewards: 0.4238\n",
      "Iteration: 925, Train loss: -1.0792, rewards: 0.4696\n",
      "Iteration: 930, Train loss: -1.0632, rewards: 0.4821\n",
      "Iteration: 935, Train loss: -1.1016, rewards: 0.4512\n",
      "Iteration: 940, Train loss: -1.0904, rewards: 0.3675\n",
      "Iteration: 945, Train loss: -1.1350, rewards: 0.4688\n",
      "Iteration: 950, Train loss: -0.9576, rewards: 0.4829\n",
      "Eval:\n",
      "Hits@1: 0.4265, Hits@3: 0.4496, Hits@10: 0.4685, MRR: 0.4421\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -1.1361, rewards: 0.3496\n",
      "Iteration: 960, Train loss: -1.1919, rewards: 0.4725\n",
      "Iteration: 965, Train loss: -1.1719, rewards: 0.4396\n",
      "Iteration: 970, Train loss: -1.1295, rewards: 0.4471\n",
      "Iteration: 975, Train loss: -1.0748, rewards: 0.4196\n",
      "Iteration: 980, Train loss: -1.0010, rewards: 0.4917\n",
      "Iteration: 985, Train loss: -1.0759, rewards: 0.4037\n",
      "Iteration: 990, Train loss: -1.0988, rewards: 0.4546\n",
      "Iteration: 995, Train loss: -1.0712, rewards: 0.4263\n",
      "Iteration: 1000, Train loss: -0.9612, rewards: 0.3862\n",
      "Eval:\n",
      "Hits@1: 0.4265, Hits@3: 0.4538, Hits@10: 0.4769, MRR: 0.4418\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -0.9981, rewards: 0.4158\n",
      "Iteration: 1010, Train loss: -1.0304, rewards: 0.4433\n",
      "Iteration: 1015, Train loss: -1.0704, rewards: 0.4529\n",
      "Iteration: 1020, Train loss: -1.0578, rewards: 0.4675\n",
      "Iteration: 1025, Train loss: -1.0573, rewards: 0.4054\n",
      "Iteration: 1030, Train loss: -1.0256, rewards: 0.3783\n",
      "Iteration: 1035, Train loss: -1.0147, rewards: 0.4300\n",
      "Iteration: 1040, Train loss: -1.0838, rewards: 0.3392\n",
      "Iteration: 1045, Train loss: -1.0036, rewards: 0.3896\n",
      "Iteration: 1050, Train loss: -1.0630, rewards: 0.4387\n",
      "Eval:\n",
      "Hits@1: 0.4370, Hits@3: 0.4601, Hits@10: 0.4727, MRR: 0.4506\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -1.0415, rewards: 0.4429\n",
      "Iteration: 1060, Train loss: -1.1197, rewards: 0.3871\n",
      "Iteration: 1065, Train loss: -1.0865, rewards: 0.4567\n",
      "Iteration: 1070, Train loss: -1.1222, rewards: 0.3663\n",
      "Iteration: 1075, Train loss: -1.0379, rewards: 0.4108\n",
      "Iteration: 1080, Train loss: -0.9783, rewards: 0.4163\n",
      "Iteration: 1085, Train loss: -0.9890, rewards: 0.4529\n",
      "Iteration: 1090, Train loss: -1.1230, rewards: 0.4808\n",
      "Iteration: 1095, Train loss: -0.9247, rewards: 0.4567\n",
      "Iteration: 1100, Train loss: -1.1173, rewards: 0.3937\n",
      "Eval:\n",
      "Hits@1: 0.3929, Hits@3: 0.4370, Hits@10: 0.4559, MRR: 0.4161\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.9507, rewards: 0.3033\n",
      "Iteration: 1110, Train loss: -0.9268, rewards: 0.3721\n",
      "Iteration: 1115, Train loss: -1.0058, rewards: 0.2167\n",
      "Iteration: 1120, Train loss: -1.0203, rewards: 0.2754\n",
      "Iteration: 1125, Train loss: -0.9809, rewards: 0.2275\n",
      "Iteration: 1130, Train loss: -1.0520, rewards: 0.2667\n",
      "Iteration: 1135, Train loss: -1.0360, rewards: 0.3408\n",
      "Iteration: 1140, Train loss: -0.9794, rewards: 0.2758\n",
      "Iteration: 1145, Train loss: -1.1272, rewards: 0.3033\n",
      "Iteration: 1150, Train loss: -1.0683, rewards: 0.3421\n",
      "Eval:\n",
      "Hits@1: 0.4097, Hits@3: 0.4307, Hits@10: 0.4433, MRR: 0.4222\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -1.0708, rewards: 0.2946\n",
      "Iteration: 1160, Train loss: -1.0257, rewards: 0.3008\n",
      "Iteration: 1165, Train loss: -0.9830, rewards: 0.2425\n",
      "Iteration: 1170, Train loss: -1.0452, rewards: 0.3479\n",
      "Iteration: 1175, Train loss: -1.0026, rewards: 0.2829\n",
      "Iteration: 1180, Train loss: -1.0988, rewards: 0.3575\n",
      "Iteration: 1185, Train loss: -1.0295, rewards: 0.2737\n",
      "Iteration: 1190, Train loss: -1.0190, rewards: 0.3454\n",
      "Iteration: 1195, Train loss: -0.9762, rewards: 0.3975\n",
      "Iteration: 1200, Train loss: -0.9790, rewards: 0.4017\n",
      "Eval:\n",
      "Hits@1: 0.4370, Hits@3: 0.4580, Hits@10: 0.4748, MRR: 0.4509\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -1.0802, rewards: 0.4142\n",
      "Iteration: 1210, Train loss: -0.9695, rewards: 0.3929\n",
      "Iteration: 1215, Train loss: -1.0609, rewards: 0.3937\n",
      "Iteration: 1220, Train loss: -0.7908, rewards: 0.3004\n",
      "Iteration: 1225, Train loss: -0.9810, rewards: 0.4283\n",
      "Iteration: 1230, Train loss: -0.7927, rewards: 0.4404\n",
      "Iteration: 1235, Train loss: -1.0641, rewards: 0.4125\n",
      "Iteration: 1240, Train loss: -1.0613, rewards: 0.3771\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -1.0543, rewards: 0.4213\n",
      "Iteration: 1250, Train loss: -0.8988, rewards: 0.4875\n",
      "Eval:\n",
      "Hits@1: 0.4370, Hits@3: 0.4685, Hits@10: 0.4874, MRR: 0.4557\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -0.9529, rewards: 0.4408\n",
      "Iteration: 1260, Train loss: -0.9356, rewards: 0.2733\n",
      "Iteration: 1265, Train loss: -0.9533, rewards: 0.3700\n",
      "Iteration: 1270, Train loss: -0.9483, rewards: 0.5458\n",
      "Iteration: 1275, Train loss: -0.9350, rewards: 0.4075\n",
      "Iteration: 1280, Train loss: -0.9404, rewards: 0.4075\n",
      "Iteration: 1285, Train loss: -0.9057, rewards: 0.3442\n",
      "Iteration: 1290, Train loss: -1.0153, rewards: 0.4271\n",
      "Iteration: 1295, Train loss: -0.9522, rewards: 0.4288\n",
      "Iteration: 1300, Train loss: -0.9253, rewards: 0.3450\n",
      "Eval:\n",
      "Hits@1: 0.4412, Hits@3: 0.4706, Hits@10: 0.4832, MRR: 0.4561\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -1.0189, rewards: 0.3929\n",
      "Iteration: 1310, Train loss: -1.0670, rewards: 0.4813\n",
      "Iteration: 1315, Train loss: -1.1017, rewards: 0.4813\n",
      "Iteration: 1320, Train loss: -0.8518, rewards: 0.4071\n",
      "Iteration: 1325, Train loss: -0.9182, rewards: 0.3987\n",
      "Iteration: 1330, Train loss: -0.9981, rewards: 0.3542\n",
      "Iteration: 1335, Train loss: -0.9452, rewards: 0.4767\n",
      "Iteration: 1340, Train loss: -0.9104, rewards: 0.4346\n",
      "Iteration: 1345, Train loss: -0.8412, rewards: 0.4242\n",
      "Iteration: 1350, Train loss: -1.0090, rewards: 0.4571\n",
      "Eval:\n",
      "Hits@1: 0.4517, Hits@3: 0.4706, Hits@10: 0.4895, MRR: 0.4636\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -1.1468, rewards: 0.3792\n",
      "Iteration: 1360, Train loss: -1.1488, rewards: 0.4033\n",
      "Iteration: 1365, Train loss: -0.9607, rewards: 0.4783\n",
      "Iteration: 1370, Train loss: -0.9817, rewards: 0.4079\n",
      "Iteration: 1375, Train loss: -1.0154, rewards: 0.3650\n",
      "Iteration: 1380, Train loss: -1.0619, rewards: 0.4304\n",
      "Iteration: 1385, Train loss: -0.8982, rewards: 0.4254\n",
      "Iteration: 1390, Train loss: -0.9084, rewards: 0.4217\n",
      "Iteration: 1395, Train loss: -1.0250, rewards: 0.4487\n",
      "Iteration: 1400, Train loss: -0.9876, rewards: 0.4783\n",
      "Eval:\n",
      "Hits@1: 0.4496, Hits@3: 0.4664, Hits@10: 0.4895, MRR: 0.4601\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -1.0332, rewards: 0.4283\n",
      "Iteration: 1410, Train loss: -1.0332, rewards: 0.3942\n",
      "Iteration: 1415, Train loss: -0.9870, rewards: 0.4350\n",
      "Iteration: 1420, Train loss: -1.0360, rewards: 0.4537\n",
      "Iteration: 1425, Train loss: -1.0246, rewards: 0.3996\n",
      "Iteration: 1430, Train loss: -0.9798, rewards: 0.4067\n",
      "Iteration: 1435, Train loss: -0.9242, rewards: 0.4738\n",
      "Iteration: 1440, Train loss: -1.0377, rewards: 0.4387\n",
      "Iteration: 1445, Train loss: -1.0222, rewards: 0.3688\n",
      "Iteration: 1450, Train loss: -1.0630, rewards: 0.5067\n",
      "Eval:\n",
      "Hits@1: 0.4538, Hits@3: 0.4685, Hits@10: 0.4790, MRR: 0.4615\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -1.0399, rewards: 0.4133\n",
      "Iteration: 1460, Train loss: -0.9669, rewards: 0.4913\n",
      "Iteration: 1465, Train loss: -1.0391, rewards: 0.3850\n",
      "Iteration: 1470, Train loss: -0.9461, rewards: 0.3933\n",
      "Iteration: 1475, Train loss: -1.0358, rewards: 0.4537\n",
      "Iteration: 1480, Train loss: -0.9463, rewards: 0.4288\n",
      "Iteration: 1485, Train loss: -1.0247, rewards: 0.4421\n",
      "Iteration: 1490, Train loss: -1.0430, rewards: 0.4596\n",
      "Iteration: 1495, Train loss: -0.9565, rewards: 0.4329\n",
      "Iteration: 1500, Train loss: -1.0446, rewards: 0.3933\n",
      "Eval:\n",
      "Hits@1: 0.4517, Hits@3: 0.4727, Hits@10: 0.4811, MRR: 0.4630\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -1.0385, rewards: 0.3471\n",
      "Iteration: 1510, Train loss: -0.9798, rewards: 0.4462\n",
      "Iteration: 1515, Train loss: -1.0552, rewards: 0.4192\n",
      "Iteration: 1520, Train loss: -1.0245, rewards: 0.4600\n",
      "Iteration: 1525, Train loss: -1.0257, rewards: 0.4733\n",
      "Iteration: 1530, Train loss: -1.1216, rewards: 0.4496\n",
      "Iteration: 1535, Train loss: -1.1504, rewards: 0.4358\n",
      "Iteration: 1540, Train loss: -0.9397, rewards: 0.4371\n",
      "Iteration: 1545, Train loss: -0.9143, rewards: 0.5079\n",
      "Iteration: 1550, Train loss: -0.9983, rewards: 0.3929\n",
      "Eval:\n",
      "Hits@1: 0.4349, Hits@3: 0.4622, Hits@10: 0.4811, MRR: 0.4501\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.9985, rewards: 0.2904\n",
      "Iteration: 1560, Train loss: -1.1120, rewards: 0.3654\n",
      "Iteration: 1565, Train loss: -1.1207, rewards: 0.4163\n",
      "Iteration: 1570, Train loss: -1.0933, rewards: 0.3829\n",
      "Iteration: 1575, Train loss: -1.0374, rewards: 0.4175\n",
      "Iteration: 1580, Train loss: -0.9573, rewards: 0.4746\n",
      "Iteration: 1585, Train loss: -0.8907, rewards: 0.5021\n",
      "Iteration: 1590, Train loss: -1.0379, rewards: 0.3658\n",
      "Iteration: 1595, Train loss: -1.0631, rewards: 0.4383\n",
      "Iteration: 1600, Train loss: -1.0211, rewards: 0.4142\n",
      "Eval:\n",
      "Hits@1: 0.4433, Hits@3: 0.4664, Hits@10: 0.4811, MRR: 0.4566\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.9131, rewards: 0.5125\n",
      "Iteration: 1610, Train loss: -0.9134, rewards: 0.4492\n",
      "Iteration: 1615, Train loss: -0.9651, rewards: 0.4542\n",
      "Iteration: 1620, Train loss: -1.0081, rewards: 0.4483\n",
      "Iteration: 1625, Train loss: -1.0574, rewards: 0.4662\n",
      "Iteration: 1630, Train loss: -0.9304, rewards: 0.4150\n",
      "Iteration: 1635, Train loss: -0.8347, rewards: 0.4713\n",
      "Iteration: 1640, Train loss: -0.9872, rewards: 0.4692\n",
      "Iteration: 1645, Train loss: -1.0857, rewards: 0.3925\n",
      "Iteration: 1650, Train loss: -1.0411, rewards: 0.4929\n",
      "Eval:\n",
      "Hits@1: 0.4559, Hits@3: 0.4790, Hits@10: 0.4874, MRR: 0.4679\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -1.0826, rewards: 0.4129\n",
      "Iteration: 1660, Train loss: -0.9957, rewards: 0.3713\n",
      "Iteration: 1665, Train loss: -0.9215, rewards: 0.4083\n",
      "Iteration: 1670, Train loss: -0.9953, rewards: 0.3404\n",
      "Iteration: 1675, Train loss: -0.9900, rewards: 0.3700\n",
      "Iteration: 1680, Train loss: -1.0506, rewards: 0.4217\n",
      "Iteration: 1685, Train loss: -1.1193, rewards: 0.3742\n",
      "Iteration: 1690, Train loss: -1.1363, rewards: 0.4533\n",
      "Iteration: 1695, Train loss: -1.0880, rewards: 0.4442\n",
      "Iteration: 1700, Train loss: -1.0367, rewards: 0.3554\n",
      "Eval:\n",
      "Hits@1: 0.4601, Hits@3: 0.4748, Hits@10: 0.4916, MRR: 0.4697\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -1.0296, rewards: 0.4521\n",
      "Iteration: 1710, Train loss: -0.9906, rewards: 0.3783\n",
      "Iteration: 1715, Train loss: -1.0619, rewards: 0.4304\n",
      "Iteration: 1720, Train loss: -0.8597, rewards: 0.5296\n",
      "Iteration: 1725, Train loss: -1.0122, rewards: 0.4608\n",
      "Iteration: 1730, Train loss: -0.8920, rewards: 0.4713\n",
      "Iteration: 1735, Train loss: -0.9441, rewards: 0.4121\n",
      "Iteration: 1740, Train loss: -1.0627, rewards: 0.4925\n",
      "Iteration: 1745, Train loss: -1.0430, rewards: 0.4225\n",
      "Iteration: 1750, Train loss: -1.0901, rewards: 0.4437\n",
      "Eval:\n",
      "Hits@1: 0.4601, Hits@3: 0.4706, Hits@10: 0.4832, MRR: 0.4662\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.9225, rewards: 0.3854\n",
      "Iteration: 1760, Train loss: -0.9372, rewards: 0.3762\n",
      "Iteration: 1765, Train loss: -0.9717, rewards: 0.4254\n",
      "Iteration: 1770, Train loss: -1.0360, rewards: 0.3529\n",
      "Iteration: 1775, Train loss: -0.8957, rewards: 0.4529\n",
      "Iteration: 1780, Train loss: -1.0125, rewards: 0.4833\n",
      "Iteration: 1785, Train loss: -0.8373, rewards: 0.5346\n",
      "Iteration: 1790, Train loss: -1.0031, rewards: 0.3617\n",
      "Iteration: 1795, Train loss: -1.1191, rewards: 0.4954\n",
      "Iteration: 1800, Train loss: -0.9877, rewards: 0.4104\n",
      "Eval:\n",
      "Hits@1: 0.4496, Hits@3: 0.4685, Hits@10: 0.4874, MRR: 0.4610\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -0.9946, rewards: 0.4021\n",
      "Iteration: 1810, Train loss: -0.9431, rewards: 0.4254\n",
      "Iteration: 1815, Train loss: -0.9851, rewards: 0.4121\n",
      "Iteration: 1820, Train loss: -0.8705, rewards: 0.3696\n",
      "Iteration: 1825, Train loss: -1.0766, rewards: 0.3850\n",
      "Iteration: 1830, Train loss: -0.9576, rewards: 0.3942\n",
      "Iteration: 1835, Train loss: -0.9446, rewards: 0.4500\n",
      "Iteration: 1840, Train loss: -0.9154, rewards: 0.4054\n",
      "Iteration: 1845, Train loss: -1.0308, rewards: 0.4688\n",
      "Iteration: 1850, Train loss: -1.0181, rewards: 0.4554\n",
      "Eval:\n",
      "Hits@1: 0.4475, Hits@3: 0.4706, Hits@10: 0.4811, MRR: 0.4598\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -0.9310, rewards: 0.5296\n",
      "Iteration: 1860, Train loss: -1.1249, rewards: 0.4567\n",
      "Iteration: 1865, Train loss: -1.0324, rewards: 0.3942\n",
      "Iteration: 1870, Train loss: -1.0878, rewards: 0.4688\n",
      "Iteration: 1875, Train loss: -1.0175, rewards: 0.4717\n",
      "Iteration: 1880, Train loss: -1.1047, rewards: 0.4888\n",
      "Iteration: 1885, Train loss: -1.1583, rewards: 0.4596\n",
      "Iteration: 1890, Train loss: -1.0754, rewards: 0.4208\n",
      "Iteration: 1895, Train loss: -1.0195, rewards: 0.3783\n",
      "Iteration: 1900, Train loss: -1.0891, rewards: 0.4508\n",
      "Eval:\n",
      "Hits@1: 0.4496, Hits@3: 0.4769, Hits@10: 0.4916, MRR: 0.4648\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -0.9930, rewards: 0.4658\n",
      "Iteration: 1910, Train loss: -1.0879, rewards: 0.4546\n",
      "Iteration: 1915, Train loss: -0.9512, rewards: 0.5012\n",
      "Iteration: 1920, Train loss: -1.1085, rewards: 0.3579\n",
      "Iteration: 1925, Train loss: -1.1362, rewards: 0.3779\n",
      "Iteration: 1930, Train loss: -1.0750, rewards: 0.4683\n",
      "Iteration: 1935, Train loss: -0.9069, rewards: 0.4575\n",
      "Iteration: 1940, Train loss: -0.9374, rewards: 0.4146\n",
      "Iteration: 1945, Train loss: -1.0911, rewards: 0.4700\n",
      "Iteration: 1950, Train loss: -0.9710, rewards: 0.4508\n",
      "Eval:\n"
     ]
    }
   ],
   "source": [
    "sub_task = sub_tasks_list[0]\n",
    "study = optuna.create_study(storage=f\"sqlite:///{sub_task}.db\", study_name=f\"{sub_task}\", direction = 'maximize')\n",
    "study.optimize(objective, n_trials=1000)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
