{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "b2479ab1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle5\n",
    "import pandas as pd\n",
    "import json\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"MIG-12e7197d-4e01-5bc8-aa76-2be6e3a55125\"\n",
    "\n",
    "from model.ours3 import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "a39d5a6b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_params(task = None):\n",
    "    \"\"\"Build the option dictionary that is passed to ``Trainer``.\n",
    "\n",
    "    Args:\n",
    "        task: Name of a dataset directory under\n",
    "            ``../MINERVA/datasets/data_preprocessed/``. When ``None`` the\n",
    "            'nell-995' data is used and ``model_dir``/``output_dir`` point at\n",
    "            ``./outputs_nell995-1/``. Otherwise they point at a per-task\n",
    "            sub-directory (created if missing) and ``pretrain_model_dir``\n",
    "            is set to ``./outputs_nell995-1/``.\n",
    "\n",
    "    Returns:\n",
    "        dict: paths, the loaded relation/entity vocabularies, agent settings\n",
    "        and hyperparameters.\n",
    "\n",
    "    Raises:\n",
    "        OSError: if a vocabulary file cannot be opened or a directory cannot\n",
    "            be created.\n",
    "        json.JSONDecodeError: if a vocabulary file is not valid JSON.\n",
    "    \"\"\"\n",
    "    options = {}\n",
    "\n",
    "    #basic setting\n",
    "    task_name = 'nell-995' if task is None else task\n",
    "\n",
    "    options['use_cuda'] = True\n",
    "    options['vocab_dir'] = '../MINERVA/datasets/data_preprocessed/nell/vocab/'\n",
    "    options['data_input_dir'] = f'../MINERVA/datasets/data_preprocessed/{task_name}/'\n",
    "    options['device'] = 'cuda' if options['use_cuda'] else 'cpu'\n",
    "\n",
    "    # Context managers close the vocab files deterministically instead of\n",
    "    # leaving the open handles to the garbage collector.\n",
    "    with open(os.path.join(options['vocab_dir'], 'relation_vocab.json')) as vocab_file:\n",
    "        options['relation_vocab'] = json.load(vocab_file)\n",
    "    with open(os.path.join(options['vocab_dir'], 'entity_vocab.json')) as vocab_file:\n",
    "        options['entity_vocab'] = json.load(vocab_file)\n",
    "\n",
    "    if task is None:\n",
    "        options['model_dir'] = './outputs_nell995-1/'\n",
    "        options['output_dir'] = './outputs_nell995-1/'\n",
    "    else:\n",
    "        options['pretrain_model_dir'] = './outputs_nell995-1/'\n",
    "        options['model_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        options['output_dir'] = f'./outputs_nell995-1/{task_name}/'\n",
    "        # exist_ok=True replaces the racy \"check, then create\" sequence.\n",
    "        os.makedirs(options['output_dir'], exist_ok=True)\n",
    "        os.makedirs(options['model_dir'], exist_ok=True)\n",
    "\n",
    "    #agent setting\n",
    "    options['pretrained_embeddings_relation'] = {}\n",
    "    options['pretrained_embeddings_entity'] = {}\n",
    "    options['embedding_size'] = 50\n",
    "    options['hidden_size'] = 200\n",
    "    options['use_entity_embeddings'] = 1\n",
    "    options['train_entity_embeddings'] = 1\n",
    "    options['train_relation_embeddings'] = 1\n",
    "    options['path_length'] = 3\n",
    "    options['LSTM_layers'] = 1\n",
    "    options['max_num_actions'] = 40\n",
    "    options['gnn_layer'] = 2\n",
    "\n",
    "    #hyperparameters\n",
    "    options['test_rollouts'] = 40\n",
    "    options['num_rollouts'] = 20\n",
    "    options['batch_size'] = 64\n",
    "    options['eval_batch_size'] = 32\n",
    "    options['beta'] = 0.15\n",
    "    options['Lambda'] = 0.15\n",
    "    options['gamma'] = 1\n",
    "    options['positive_reward'] = 1\n",
    "    options['negative_reward'] = 0\n",
    "    options['learning_rate'] = 0.00005\n",
    "    options['grad_clip_norm'] = 100\n",
    "    options['eval_every'] = 5\n",
    "    # NOTE(review): true division makes this a float (20.0 for batch_size 64);\n",
    "    # confirm that Trainer accepts a non-integer iteration count.\n",
    "    options['total_iterations'] = 20*(64/options['batch_size'])\n",
    "    options['pool'] = 'max'\n",
    "\n",
    "    return options"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "12f1b8ba",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "Contains full graph\n",
      "batcher loaded\n"
     ]
    }
   ],
   "source": [
    "# Beam-search test run of the checkpoint stored in params['model_dir'].\n",
    "params = set_params()\n",
    "# Test-time overrides of the defaults returned by set_params().\n",
    "params['test_rollouts'] = 100\n",
    "params['max_num_actions'] = 100\n",
    "params['eval_batch_size'] = 8\n",
    "\n",
    "trainer = Trainer(params)\n",
    "# map_location='cpu' lets the checkpoint be deserialised regardless of the\n",
    "# device it was saved from; load_state_dict then copies the values into the\n",
    "# agent's existing parameters. The objective() cell loads checkpoints the same way.\n",
    "trainer.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location='cpu'))\n",
    "trainer.agent.eval()\n",
    "\n",
    "save_path = trainer.save_path\n",
    "output_dir = trainer.output_dir\n",
    "path_logger_file = output_dir\n",
    "\n",
    "# Directory that receives the logged paths of this beam-search run.\n",
    "beam_dir = path_logger_file + \"/\" + \"test_beam\"\n",
    "os.makedirs(beam_dir, exist_ok=True)\n",
    "trainer.path_logger_file_ = beam_dir + \"/paths\"\n",
    "with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "    score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "# NOTE(review): test_test_environment is presumably the held-out test split\n",
    "# (as opposed to a dev split) - confirm in Trainer.\n",
    "trainer.test_environment = trainer.test_test_environment\n",
    "test_results = trainer.test(beam=True, print_paths=True, save_model=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "17bc5425",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "AthletePlaysInLeague\n",
      "MINERVA MAP: 0.8207787473535506 (381 queries evaluated)\n",
      "AthletePlaysForTeam \n",
      "MINERVA MAP: 0.6278593427818233 (387 queries evaluated)\n",
      "AthleteHomeStadium \n",
      "MINERVA MAP: 0.572523027000639 (201 queries evaluated)\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8249362244897959 (112 queries evaluated)\n",
      "AthletePlaysSport\n",
      "MINERVA MAP: 0.9319237147595357 (603 queries evaluated)\n",
      "OrganizationHiredPerson\n",
      "MINERVA MAP: 0.9153204137843777 (349 queries evaluated)\n",
      "PersonBornInLocation\n",
      "MINERVA MAP: 0.8065181795751745 (193 queries evaluated)\n",
      "WorksFor.txt\n",
      "MINERVA MAP: 0.8287528177373783 (421 queries evaluated)\n",
      "organizationheadquarteredincity\n",
      "MINERVA MAP: 0.9408317251690747 (249 queries evaluated)\n",
      "PersonLeadsOrganization\n",
      "MINERVA MAP: 0.8386739927983896 (179 queries evaluated)\n"
     ]
    }
   ],
   "source": [
    "# Relation labels to score. Two labels carry a trailing space; it is kept in\n",
    "# the printed label / dict key and stripped only when the file name is built.\n",
    "sub_tasks_list = [\n",
    "    'AthletePlaysInLeague',\n",
    "    'AthletePlaysForTeam ',\n",
    "    'AthleteHomeStadium ',\n",
    "    'TeamPlaysSport',\n",
    "    'AthletePlaysSport',\n",
    "    'OrganizationHiredPerson',\n",
    "    'PersonBornInLocation',\n",
    "    'WorksFor',\n",
    "    'organizationheadquarteredincity',\n",
    "    'PersonLeadsOrganization',\n",
    "]\n",
    "\n",
    "# The per-relation sort_test_* files are read from the nell-995 directory.\n",
    "trainer.data_input_dir = '../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "# File written by the beam-search test run; identical for every relation.\n",
    "answers_file = path_logger_file + '/' + 'test_beam/' + 'pathsanswers'\n",
    "\n",
    "# Result of nell_eval per relation, keyed by the label exactly as printed.\n",
    "map_list = {}\n",
    "for sub_task in sub_tasks_list:\n",
    "    # '.txt' is appended for WorksFor only; the suffixed label is also the key.\n",
    "    if sub_task.lower() == 'worksfor':\n",
    "        sub_task += '.txt'\n",
    "    print(sub_task)\n",
    "    sorted_test_file = f'{trainer.data_input_dir}/sort_test_{sub_task.lower().strip()}'\n",
    "    map_list[sub_task] = nell_eval(answers_file, sorted_test_file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "10a372ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "import optuna\n",
    "from model.ours3 import *\n",
    "\n",
    "\n",
    "# Sub-tasks available for tuning; objective() only ever uses the first entry.\n",
    "sub_tasks_list = [\n",
    "# 'AthletePlaysInLeague',\n",
    "# 'AthletePlaysForTeam ',\n",
    "#'AthleteHomeStadium '\n",
    "'TeamPlaysSport',\n",
    "# 'AthletePlaysSport',\n",
    "# 'OrganizationHiredPerson',\n",
    "# 'PersonBornInLocation',\n",
    "# 'WorksFor',\n",
    "# 'organizationheadquarteredincity',\n",
    "#'PersonLeadsOrganization'\n",
    "]\n",
    "\n",
    "def objective(trial):\n",
    "    \"\"\"Optuna objective: fine-tune the agent on one sub-task and return its MAP.\n",
    "\n",
    "    Samples learning rate, batch size, beta, Lambda and the evaluation\n",
    "    interval from ``trial``, initialises a ``Trainer`` from the checkpoint in\n",
    "    ``pretrain_model_dir`` and trains it. A second ``Trainer`` then loads\n",
    "    ``agent.ckpt`` from ``model_dir`` (presumably written by ``train()`` -\n",
    "    confirm), runs a beam-search test and the logged answers are scored\n",
    "    with ``nell_eval``.\n",
    "\n",
    "    Args:\n",
    "        trial: optuna trial used to sample the hyperparameters.\n",
    "\n",
    "    Returns:\n",
    "        The value returned by ``nell_eval`` for ``sub_tasks_list[0]``.\n",
    "    \"\"\"\n",
    "    # Imported here so the function does not rely on the star import above\n",
    "    # happening to re-export ``gc``.\n",
    "    import gc\n",
    "\n",
    "    sub_task = sub_tasks_list[0]\n",
    "\n",
    "    # NOTE(review): 'lr' is sampled uniformly across four orders of magnitude;\n",
    "    # log=True may suit a new study better. Left unchanged so the distribution\n",
    "    # stays compatible with trials already stored for this study.\n",
    "    lr = trial.suggest_float('lr', 1e-6, 1e-2)\n",
    "    bs = trial.suggest_int('bs', 4, 128)\n",
    "    beta = trial.suggest_float('b', 0, 0.5)\n",
    "    lam = trial.suggest_float('l', 0, 0.5)\n",
    "    ee = trial.suggest_categorical('ee', [10,20,50,100])\n",
    "\n",
    "    params = set_params(sub_task.lower().strip())\n",
    "    params['learning_rate'] = lr\n",
    "    params['eval_every'] = ee\n",
    "    params['batch_size'] = bs\n",
    "    params['beta'] = beta\n",
    "    params['Lambda'] = lam\n",
    "    # 50 evaluation rounds, capped at 2000 iterations.\n",
    "    params['total_iterations'] = min(50*params['eval_every'], 2000)\n",
    "\n",
    "    sub_trainer = Trainer(params)\n",
    "    sub_trainer.agent.load_state_dict(torch.load(params['pretrain_model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "\n",
    "    sub_trainer.agent.train()\n",
    "    sub_trainer.train()\n",
    "\n",
    "    # The training Trainer is no longer used: release it before the tester is\n",
    "    # built so two Trainers are not alive at once. Collect first so that\n",
    "    # empty_cache() can return the blocks freed by the collector.\n",
    "    del sub_trainer\n",
    "    gc.collect()\n",
    "    torch.cuda.empty_cache()\n",
    "\n",
    "    # Test-time overrides, same values as the standalone beam-test cell.\n",
    "    params['test_rollouts'] = 100\n",
    "    params['max_num_actions'] = 100\n",
    "    params['eval_batch_size'] = 8\n",
    "\n",
    "    sub_tester = Trainer(params)\n",
    "    sub_tester.agent.load_state_dict(torch.load(params['model_dir'] + 'agent.ckpt', map_location = 'cpu'))\n",
    "    sub_tester.agent.eval()\n",
    "\n",
    "    save_path = sub_tester.save_path\n",
    "    output_dir = sub_tester.output_dir\n",
    "    path_logger_file = output_dir\n",
    "\n",
    "    # Directory that receives the logged paths of this beam-search run.\n",
    "    beam_dir = path_logger_file + \"/\" + \"test_beam\"\n",
    "    os.makedirs(beam_dir, exist_ok=True)\n",
    "    sub_tester.path_logger_file_ = beam_dir + \"/paths\"\n",
    "    with open(output_dir + '/scores.txt', 'a') as score_file:\n",
    "        score_file.write(\"Test (beam) scores with best model from \" + save_path + \"\\n\")\n",
    "\n",
    "    sub_tester.test_environment = sub_tester.test_test_environment\n",
    "    sub_tester.test(beam=True, print_paths=True, save_model=True)\n",
    "\n",
    "    # The sort_test_* files are read from the nell-995 directory.\n",
    "    sub_tester.data_input_dir = '../MINERVA/datasets/data_preprocessed/nell-995'\n",
    "\n",
    "    # '.txt' is appended for WorksFor only.\n",
    "    if 'worksfor' == sub_task.lower():\n",
    "        sub_task = sub_task + '.txt'\n",
    "    print(sub_task)\n",
    "    MAP = nell_eval(beam_dir + \"/pathsanswers\",\n",
    "              sub_tester.data_input_dir+f'/sort_test_{sub_task.lower().strip()}')\n",
    "\n",
    "    # Drop the tester, collect, then release cached CUDA memory.\n",
    "    del sub_tester\n",
    "    gc.collect()\n",
    "    torch.cuda.empty_cache()\n",
    "\n",
    "    return MAP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9e9a1487",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:11:12,472]\u001b[0m A new study created in RDB with name: TeamPlaysSport\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 2, Train loss: -0.2369, rewards: 0.3250\n",
      "Iteration: 4, Train loss: -0.0015, rewards: 0.0158\n",
      "Iteration: 6, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 8, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 10, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 12, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 14, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 16, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 18, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 20, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0054\n",
      "------------------------------------------------------------\n",
      "Iteration: 22, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 24, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 26, Train loss: 0.0000, rewards: 0.0000\n",
      "Iteration: 28, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 30, Train loss: 0.0000, rewards: 0.0000\n",
      "Iteration: 32, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 34, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 36, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 38, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 40, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0016\n",
      "------------------------------------------------------------\n",
      "Iteration: 42, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 44, Train loss: -0.0000, rewards: 0.0333\n",
      "Iteration: 46, Train loss: -0.0008, rewards: 0.1000\n",
      "Iteration: 48, Train loss: -0.0000, rewards: 0.1333\n",
      "Iteration: 50, Train loss: -0.0001, rewards: 0.1992\n",
      "Iteration: 52, Train loss: 0.0000, rewards: 0.2167\n",
      "Iteration: 54, Train loss: -0.0035, rewards: 0.0667\n",
      "Iteration: 56, Train loss: -0.0035, rewards: 0.1833\n",
      "Iteration: 58, Train loss: -0.0020, rewards: 0.0500\n",
      "Iteration: 60, Train loss: -0.0025, rewards: 0.0833\n",
      "Eval:\n",
      "Hits@1: 0.2062, Hits@3: 0.2990, Hits@10: 0.4639, MRR: 0.2759\n",
      "------------------------------------------------------------\n",
      "Iteration: 62, Train loss: -0.0015, rewards: 0.1167\n",
      "Iteration: 64, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 66, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 68, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 70, Train loss: -0.0006, rewards: 0.0000\n",
      "Iteration: 72, Train loss: -0.0017, rewards: 0.0000\n",
      "Iteration: 74, Train loss: -0.0010, rewards: 0.0000\n",
      "Iteration: 76, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 78, Train loss: -0.0036, rewards: 0.0167\n",
      "Iteration: 80, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0007\n",
      "------------------------------------------------------------\n",
      "Iteration: 82, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 84, Train loss: 0.0000, rewards: 0.0000\n",
      "Iteration: 86, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 88, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 90, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 92, Train loss: -0.0001, rewards: 0.0167\n",
      "Iteration: 94, Train loss: -0.0055, rewards: 0.0667\n",
      "Iteration: 96, Train loss: -0.0012, rewards: 0.0167\n",
      "Iteration: 98, Train loss: -0.0060, rewards: 0.0167\n",
      "Iteration: 100, Train loss: 0.0279, rewards: 0.1042\n",
      "Eval:\n",
      "Hits@1: 0.1959, Hits@3: 0.3608, Hits@10: 0.5464, MRR: 0.3085\n",
      "------------------------------------------------------------\n",
      "Iteration: 102, Train loss: 0.0344, rewards: 0.2300\n",
      "Iteration: 104, Train loss: 0.0019, rewards: 0.1667\n",
      "Iteration: 106, Train loss: 0.0260, rewards: 0.1725\n",
      "Iteration: 108, Train loss: 0.0260, rewards: 0.0500\n",
      "Iteration: 110, Train loss: 0.0087, rewards: 0.0875\n",
      "Iteration: 112, Train loss: 0.0139, rewards: 0.1542\n",
      "Iteration: 114, Train loss: 0.0160, rewards: 0.1583\n",
      "Iteration: 116, Train loss: -0.0108, rewards: 0.1592\n",
      "Iteration: 118, Train loss: 0.0074, rewards: 0.2650\n",
      "Iteration: 120, Train loss: -0.0004, rewards: 0.1817\n",
      "Eval:\n",
      "Hits@1: 0.1340, Hits@3: 0.2680, Hits@10: 0.3814, MRR: 0.2189\n",
      "------------------------------------------------------------\n",
      "Iteration: 122, Train loss: -0.0025, rewards: 0.1667\n",
      "Iteration: 124, Train loss: -0.0120, rewards: 0.2333\n",
      "Iteration: 126, Train loss: -0.0041, rewards: 0.2833\n",
      "Iteration: 128, Train loss: 0.0050, rewards: 0.1783\n",
      "Iteration: 130, Train loss: -0.0015, rewards: 0.2000\n",
      "Iteration: 132, Train loss: 0.0074, rewards: 0.2833\n",
      "Iteration: 134, Train loss: 0.0104, rewards: 0.2033\n",
      "Iteration: 136, Train loss: -0.0102, rewards: 0.2833\n",
      "Iteration: 138, Train loss: 0.0229, rewards: 0.2475\n",
      "Iteration: 140, Train loss: 0.0010, rewards: 0.2000\n",
      "Eval:\n",
      "Hits@1: 0.2887, Hits@3: 0.5052, Hits@10: 0.7113, MRR: 0.4225\n",
      "------------------------------------------------------------\n",
      "Iteration: 142, Train loss: 0.0142, rewards: 0.2333\n",
      "Iteration: 144, Train loss: 0.0016, rewards: 0.1000\n",
      "Iteration: 146, Train loss: -0.0018, rewards: 0.1333\n",
      "Iteration: 148, Train loss: -0.0097, rewards: 0.2500\n",
      "Iteration: 150, Train loss: -0.0091, rewards: 0.3333\n",
      "Iteration: 152, Train loss: -0.0069, rewards: 0.3325\n",
      "Iteration: 154, Train loss: -0.0027, rewards: 0.3000\n",
      "Iteration: 156, Train loss: -0.0071, rewards: 0.2333\n",
      "Iteration: 158, Train loss: -0.0070, rewards: 0.2825\n",
      "Iteration: 160, Train loss: -0.0015, rewards: 0.1833\n",
      "Eval:\n",
      "Hits@1: 0.2062, Hits@3: 0.2680, Hits@10: 0.3299, MRR: 0.2478\n",
      "------------------------------------------------------------\n",
      "Iteration: 162, Train loss: -0.0023, rewards: 0.2033\n",
      "Iteration: 164, Train loss: -0.0000, rewards: 0.1833\n",
      "Iteration: 166, Train loss: -0.0040, rewards: 0.0667\n",
      "Iteration: 168, Train loss: 0.0347, rewards: 0.0142\n",
      "Iteration: 170, Train loss: -0.0080, rewards: 0.0000\n",
      "Iteration: 172, Train loss: 0.0081, rewards: 0.0167\n",
      "Iteration: 174, Train loss: -0.0177, rewards: 0.0333\n",
      "Iteration: 176, Train loss: -0.0073, rewards: 0.0000\n",
      "Iteration: 178, Train loss: -0.0061, rewards: 0.0000\n",
      "Iteration: 180, Train loss: -0.0096, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0206, MRR: 0.0082\n",
      "------------------------------------------------------------\n",
      "Iteration: 182, Train loss: -0.0077, rewards: 0.0000\n",
      "Iteration: 184, Train loss: -0.0066, rewards: 0.0000\n",
      "Iteration: 186, Train loss: -0.0073, rewards: 0.0000\n",
      "Iteration: 188, Train loss: -0.0083, rewards: 0.0000\n",
      "Iteration: 190, Train loss: -0.0073, rewards: 0.0000\n",
      "Iteration: 192, Train loss: -0.0066, rewards: 0.0000\n",
      "Iteration: 194, Train loss: -0.0053, rewards: 0.0000\n",
      "Iteration: 196, Train loss: -0.0044, rewards: 0.0000\n",
      "Iteration: 198, Train loss: -0.0043, rewards: 0.0000\n",
      "Iteration: 200, Train loss: -0.0034, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0206, MRR: 0.0070\n",
      "------------------------------------------------------------\n",
      "Iteration: 202, Train loss: -0.0045, rewards: 0.0167\n",
      "Iteration: 204, Train loss: -0.0008, rewards: 0.0000\n",
      "Iteration: 206, Train loss: -0.0008, rewards: 0.0000\n",
      "Iteration: 208, Train loss: -0.0003, rewards: 0.0167\n",
      "Iteration: 210, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 212, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 214, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 216, Train loss: -0.0001, rewards: 0.0167\n",
      "Iteration: 218, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 220, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0103, Hits@3: 0.0103, Hits@10: 0.0103, MRR: 0.0126\n",
      "------------------------------------------------------------\n",
      "Iteration: 222, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 224, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 226, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 228, Train loss: -0.0017, rewards: 0.0167\n",
      "Iteration: 230, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 232, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 234, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 236, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 238, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 240, Train loss: -0.0007, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0103, MRR: 0.0064\n",
      "------------------------------------------------------------\n",
      "Iteration: 242, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 244, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 246, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 248, Train loss: -0.0004, rewards: 0.0000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 250, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 252, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 254, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 256, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 258, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 260, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0041\n",
      "------------------------------------------------------------\n",
      "Iteration: 262, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 264, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 266, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 268, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 270, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 272, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 274, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 276, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 278, Train loss: -0.0007, rewards: 0.0167\n",
      "Iteration: 280, Train loss: -0.0004, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0047\n",
      "------------------------------------------------------------\n",
      "Iteration: 282, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 284, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 286, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 288, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 290, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 292, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 294, Train loss: -0.0011, rewards: 0.0167\n",
      "Iteration: 296, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 298, Train loss: -0.0000, rewards: 0.0333\n",
      "Iteration: 300, Train loss: -0.0001, rewards: 0.0167\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0103, MRR: 0.0053\n",
      "------------------------------------------------------------\n",
      "Iteration: 302, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 304, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 306, Train loss: -0.0007, rewards: 0.0333\n",
      "Iteration: 308, Train loss: -0.0006, rewards: 0.0000\n",
      "Iteration: 310, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 312, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 314, Train loss: -0.0010, rewards: 0.0167\n",
      "Iteration: 316, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 318, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 320, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0103, MRR: 0.0051\n",
      "------------------------------------------------------------\n",
      "Iteration: 322, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 324, Train loss: -0.0010, rewards: 0.0000\n",
      "Iteration: 326, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 328, Train loss: -0.0011, rewards: 0.0167\n",
      "Iteration: 330, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 332, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 334, Train loss: -0.0006, rewards: 0.0000\n",
      "Iteration: 336, Train loss: -0.0003, rewards: 0.0167\n",
      "Iteration: 338, Train loss: -0.0007, rewards: 0.0000\n",
      "Iteration: 340, Train loss: -0.0003, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0206, MRR: 0.0049\n",
      "------------------------------------------------------------\n",
      "Iteration: 342, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 344, Train loss: -0.0014, rewards: 0.0000\n",
      "Iteration: 346, Train loss: -0.0014, rewards: 0.0000\n",
      "Iteration: 348, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 350, Train loss: -0.0011, rewards: 0.0000\n",
      "Iteration: 352, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 354, Train loss: -0.0014, rewards: 0.0167\n",
      "Iteration: 356, Train loss: -0.0014, rewards: 0.0000\n",
      "Iteration: 358, Train loss: -0.0014, rewards: 0.0000\n",
      "Iteration: 360, Train loss: -0.0024, rewards: 0.0167\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0206, MRR: 0.0060\n",
      "------------------------------------------------------------\n",
      "Iteration: 362, Train loss: -0.0017, rewards: 0.0000\n",
      "Iteration: 364, Train loss: -0.0025, rewards: 0.0167\n",
      "Iteration: 366, Train loss: -0.0011, rewards: 0.0000\n",
      "Iteration: 368, Train loss: -0.0016, rewards: 0.0167\n",
      "Iteration: 370, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 372, Train loss: -0.0000, rewards: 0.0167\n",
      "Iteration: 374, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 376, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 378, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 380, Train loss: -0.0018, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0206, Hits@3: 0.0722, Hits@10: 0.1340, MRR: 0.0637\n",
      "------------------------------------------------------------\n",
      "Iteration: 382, Train loss: -0.0052, rewards: 0.0000\n",
      "Iteration: 384, Train loss: -0.0102, rewards: 0.0167\n",
      "Iteration: 386, Train loss: 0.0149, rewards: 0.0508\n",
      "Iteration: 388, Train loss: 0.0288, rewards: 0.1667\n",
      "Iteration: 390, Train loss: 0.0297, rewards: 0.1333\n",
      "Iteration: 392, Train loss: 0.0135, rewards: 0.1000\n",
      "Iteration: 394, Train loss: 0.0055, rewards: 0.2000\n",
      "Iteration: 396, Train loss: 0.0336, rewards: 0.1500\n",
      "Iteration: 398, Train loss: 0.0261, rewards: 0.2333\n",
      "Iteration: 400, Train loss: 0.0381, rewards: 0.2333\n",
      "Eval:\n",
      "Hits@1: 0.2268, Hits@3: 0.3814, Hits@10: 0.4227, MRR: 0.3018\n",
      "------------------------------------------------------------\n",
      "Iteration: 402, Train loss: 0.0201, rewards: 0.1667\n",
      "Iteration: 404, Train loss: 0.0393, rewards: 0.2000\n",
      "Iteration: 406, Train loss: 0.0031, rewards: 0.2333\n",
      "Iteration: 408, Train loss: 0.0178, rewards: 0.1833\n",
      "Iteration: 410, Train loss: 0.0171, rewards: 0.3000\n",
      "Iteration: 412, Train loss: 0.0229, rewards: 0.1167\n",
      "Iteration: 414, Train loss: 0.0261, rewards: 0.2333\n",
      "Iteration: 416, Train loss: 0.0412, rewards: 0.2500\n",
      "Iteration: 418, Train loss: 0.0234, rewards: 0.3167\n",
      "Iteration: 420, Train loss: -0.0001, rewards: 0.2167\n",
      "Eval:\n",
      "Hits@1: 0.2577, Hits@3: 0.3711, Hits@10: 0.4639, MRR: 0.3262\n",
      "------------------------------------------------------------\n",
      "Iteration: 422, Train loss: 0.0361, rewards: 0.2342\n",
      "Iteration: 424, Train loss: 0.0190, rewards: 0.3167\n",
      "Iteration: 426, Train loss: 0.0259, rewards: 0.3500\n",
      "Iteration: 428, Train loss: 0.0186, rewards: 0.3500\n",
      "Iteration: 430, Train loss: 0.0043, rewards: 0.2933\n",
      "Iteration: 432, Train loss: 0.0212, rewards: 0.3167\n",
      "Iteration: 434, Train loss: 0.0004, rewards: 0.3000\n",
      "Iteration: 436, Train loss: 0.0426, rewards: 0.3167\n",
      "Iteration: 438, Train loss: 0.0097, rewards: 0.2000\n",
      "Iteration: 440, Train loss: 0.0122, rewards: 0.2983\n",
      "Eval:\n",
      "Hits@1: 0.2577, Hits@3: 0.3918, Hits@10: 0.5052, MRR: 0.3382\n",
      "------------------------------------------------------------\n",
      "Iteration: 442, Train loss: 0.0338, rewards: 0.3500\n",
      "Iteration: 444, Train loss: 0.0199, rewards: 0.3333\n",
      "Iteration: 446, Train loss: 0.0156, rewards: 0.4333\n",
      "Iteration: 448, Train loss: 0.0178, rewards: 0.3500\n",
      "Iteration: 450, Train loss: 0.0278, rewards: 0.3167\n",
      "Iteration: 452, Train loss: 0.0215, rewards: 0.3667\n",
      "Iteration: 454, Train loss: 0.0222, rewards: 0.2817\n",
      "Iteration: 456, Train loss: 0.0171, rewards: 0.2658\n",
      "Iteration: 458, Train loss: 0.0360, rewards: 0.4500\n",
      "Iteration: 460, Train loss: -0.0109, rewards: 0.4700\n",
      "Eval:\n",
      "Hits@1: 0.3402, Hits@3: 0.4845, Hits@10: 0.6082, MRR: 0.4310\n",
      "------------------------------------------------------------\n",
      "Iteration: 462, Train loss: 0.0223, rewards: 0.3833\n",
      "Iteration: 464, Train loss: 0.0346, rewards: 0.3817\n",
      "Iteration: 466, Train loss: 0.0270, rewards: 0.3667\n",
      "Iteration: 468, Train loss: 0.0293, rewards: 0.2833\n",
      "Iteration: 470, Train loss: 0.0178, rewards: 0.3267\n",
      "Iteration: 472, Train loss: 0.0307, rewards: 0.3833\n",
      "Iteration: 474, Train loss: 0.0123, rewards: 0.4333\n",
      "Iteration: 476, Train loss: 0.0026, rewards: 0.3392\n",
      "Iteration: 478, Train loss: 0.0252, rewards: 0.4000\n",
      "Iteration: 480, Train loss: 0.0173, rewards: 0.3500\n",
      "Eval:\n",
      "Hits@1: 0.3814, Hits@3: 0.4948, Hits@10: 0.6186, MRR: 0.4611\n",
      "------------------------------------------------------------\n",
      "Iteration: 482, Train loss: 0.0264, rewards: 0.3667\n",
      "Iteration: 484, Train loss: 0.0483, rewards: 0.3833\n",
      "Iteration: 486, Train loss: 0.0195, rewards: 0.3000\n",
      "Iteration: 488, Train loss: 0.0171, rewards: 0.3667\n",
      "Iteration: 490, Train loss: 0.0227, rewards: 0.3833\n",
      "Iteration: 492, Train loss: 0.0507, rewards: 0.3833\n",
      "Iteration: 494, Train loss: 0.0296, rewards: 0.3000\n",
      "Iteration: 496, Train loss: 0.0069, rewards: 0.3833\n",
      "Iteration: 498, Train loss: 0.0351, rewards: 0.1833\n",
      "Iteration: 500, Train loss: 0.0329, rewards: 0.4167\n",
      "Eval:\n",
      "Hits@1: 0.3711, Hits@3: 0.5258, Hits@10: 0.6392, MRR: 0.4716\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 502, Train loss: 0.0131, rewards: 0.4333\n",
      "Iteration: 504, Train loss: 0.0482, rewards: 0.3333\n",
      "Iteration: 506, Train loss: 0.0454, rewards: 0.3667\n",
      "Iteration: 508, Train loss: 0.0254, rewards: 0.2850\n",
      "Iteration: 510, Train loss: 0.0267, rewards: 0.3833\n",
      "Iteration: 512, Train loss: 0.0358, rewards: 0.3000\n",
      "Iteration: 514, Train loss: 0.0190, rewards: 0.3500\n",
      "Iteration: 516, Train loss: 0.0210, rewards: 0.4833\n",
      "Iteration: 518, Train loss: 0.0101, rewards: 0.3833\n",
      "Iteration: 520, Train loss: 0.0377, rewards: 0.4667\n",
      "Eval:\n",
      "Hits@1: 0.3402, Hits@3: 0.4845, Hits@10: 0.6392, MRR: 0.4457\n",
      "------------------------------------------------------------\n",
      "Iteration: 522, Train loss: 0.0079, rewards: 0.4167\n",
      "Iteration: 524, Train loss: -0.0045, rewards: 0.3667\n",
      "Iteration: 526, Train loss: 0.0398, rewards: 0.2500\n",
      "Iteration: 528, Train loss: -0.0056, rewards: 0.2333\n",
      "Iteration: 530, Train loss: 0.0399, rewards: 0.3492\n",
      "Iteration: 532, Train loss: 0.0081, rewards: 0.2833\n",
      "Iteration: 534, Train loss: 0.0294, rewards: 0.3833\n",
      "Iteration: 536, Train loss: 0.0313, rewards: 0.3167\n",
      "Iteration: 538, Train loss: 0.0344, rewards: 0.3667\n",
      "Iteration: 540, Train loss: 0.0116, rewards: 0.3667\n",
      "Eval:\n",
      "Hits@1: 0.3402, Hits@3: 0.5052, Hits@10: 0.6392, MRR: 0.4491\n",
      "------------------------------------------------------------\n",
      "Iteration: 542, Train loss: 0.0065, rewards: 0.2833\n",
      "Iteration: 544, Train loss: -0.0009, rewards: 0.3833\n",
      "Iteration: 546, Train loss: 0.0317, rewards: 0.3500\n",
      "Iteration: 548, Train loss: -0.0210, rewards: 0.2333\n",
      "Iteration: 550, Train loss: -0.0175, rewards: 0.3000\n",
      "Iteration: 552, Train loss: -0.0085, rewards: 0.3667\n",
      "Iteration: 554, Train loss: -0.0041, rewards: 0.1667\n",
      "Iteration: 556, Train loss: 0.0071, rewards: 0.1500\n",
      "Iteration: 558, Train loss: 0.0138, rewards: 0.2500\n",
      "Iteration: 560, Train loss: 0.0162, rewards: 0.2167\n",
      "Eval:\n",
      "Hits@1: 0.2371, Hits@3: 0.4639, Hits@10: 0.5979, MRR: 0.3594\n",
      "------------------------------------------------------------\n",
      "Iteration: 562, Train loss: 0.0119, rewards: 0.2667\n",
      "Iteration: 564, Train loss: -0.0087, rewards: 0.2500\n",
      "Iteration: 566, Train loss: 0.0211, rewards: 0.2167\n",
      "Iteration: 568, Train loss: -0.0085, rewards: 0.1833\n",
      "Iteration: 570, Train loss: 0.0380, rewards: 0.2500\n",
      "Iteration: 572, Train loss: 0.0262, rewards: 0.1925\n",
      "Iteration: 574, Train loss: 0.0044, rewards: 0.2825\n",
      "Iteration: 576, Train loss: 0.0085, rewards: 0.2000\n",
      "Iteration: 578, Train loss: 0.0084, rewards: 0.2000\n",
      "Iteration: 580, Train loss: -0.0120, rewards: 0.2500\n",
      "Eval:\n",
      "Hits@1: 0.2474, Hits@3: 0.4639, Hits@10: 0.5773, MRR: 0.3596\n",
      "------------------------------------------------------------\n",
      "Iteration: 582, Train loss: 0.0083, rewards: 0.1833\n",
      "Iteration: 584, Train loss: 0.0014, rewards: 0.2167\n",
      "Iteration: 586, Train loss: 0.0136, rewards: 0.3050\n",
      "Iteration: 588, Train loss: 0.0266, rewards: 0.3000\n",
      "Iteration: 590, Train loss: 0.0082, rewards: 0.3333\n",
      "Iteration: 592, Train loss: 0.0057, rewards: 0.3333\n",
      "Iteration: 594, Train loss: 0.0168, rewards: 0.2667\n",
      "Iteration: 596, Train loss: -0.0177, rewards: 0.2850\n",
      "Iteration: 598, Train loss: 0.0154, rewards: 0.3500\n",
      "Iteration: 600, Train loss: 0.0005, rewards: 0.2500\n",
      "Eval:\n",
      "Hits@1: 0.3093, Hits@3: 0.5052, Hits@10: 0.5876, MRR: 0.4053\n",
      "------------------------------------------------------------\n",
      "Iteration: 602, Train loss: 0.0272, rewards: 0.2783\n",
      "Iteration: 604, Train loss: 0.0051, rewards: 0.2333\n",
      "Iteration: 606, Train loss: -0.0078, rewards: 0.4500\n",
      "Iteration: 608, Train loss: 0.0222, rewards: 0.2667\n",
      "Iteration: 610, Train loss: 0.0338, rewards: 0.1833\n",
      "Iteration: 612, Train loss: -0.0126, rewards: 0.2675\n",
      "Iteration: 614, Train loss: 0.0167, rewards: 0.3333\n",
      "Iteration: 616, Train loss: 0.0203, rewards: 0.2333\n",
      "Iteration: 618, Train loss: 0.0005, rewards: 0.2000\n",
      "Iteration: 620, Train loss: 0.0295, rewards: 0.2500\n",
      "Eval:\n",
      "Hits@1: 0.3402, Hits@3: 0.5052, Hits@10: 0.5876, MRR: 0.4261\n",
      "------------------------------------------------------------\n",
      "Iteration: 622, Train loss: 0.0011, rewards: 0.3158\n",
      "Iteration: 624, Train loss: 0.0173, rewards: 0.3417\n",
      "Iteration: 626, Train loss: 0.0307, rewards: 0.2258\n",
      "Iteration: 628, Train loss: 0.0336, rewards: 0.5167\n",
      "Iteration: 630, Train loss: 0.0309, rewards: 0.4667\n",
      "Iteration: 632, Train loss: 0.0073, rewards: 0.6500\n",
      "Iteration: 634, Train loss: 0.0327, rewards: 0.4667\n",
      "Iteration: 636, Train loss: 0.0023, rewards: 0.6333\n",
      "Iteration: 638, Train loss: 0.0184, rewards: 0.6158\n",
      "Iteration: 640, Train loss: 0.0313, rewards: 0.5667\n",
      "Eval:\n",
      "Hits@1: 0.5052, Hits@3: 0.6186, Hits@10: 0.6804, MRR: 0.5702\n",
      "------------------------------------------------------------\n",
      "Iteration: 642, Train loss: 0.0090, rewards: 0.4167\n",
      "Iteration: 644, Train loss: 0.0222, rewards: 0.4667\n",
      "Iteration: 646, Train loss: 0.0006, rewards: 0.5167\n",
      "Iteration: 648, Train loss: 0.0121, rewards: 0.4833\n",
      "Iteration: 650, Train loss: 0.0173, rewards: 0.5500\n",
      "Iteration: 652, Train loss: -0.0076, rewards: 0.4500\n",
      "Iteration: 654, Train loss: -0.0035, rewards: 0.4167\n",
      "Iteration: 656, Train loss: -0.0262, rewards: 0.4000\n",
      "Iteration: 658, Train loss: -0.0616, rewards: 0.1167\n",
      "Iteration: 660, Train loss: -0.0365, rewards: 0.1000\n",
      "Eval:\n",
      "Hits@1: 0.3711, Hits@3: 0.4536, Hits@10: 0.5361, MRR: 0.4251\n",
      "------------------------------------------------------------\n",
      "Iteration: 662, Train loss: -0.0183, rewards: 0.6333\n",
      "Iteration: 664, Train loss: 0.0525, rewards: 0.4950\n",
      "Iteration: 666, Train loss: 0.0084, rewards: 0.6000\n",
      "Iteration: 668, Train loss: 0.0372, rewards: 0.5833\n",
      "Iteration: 670, Train loss: 0.0385, rewards: 0.5500\n",
      "Iteration: 672, Train loss: 0.0252, rewards: 0.3667\n",
      "Iteration: 674, Train loss: 0.0197, rewards: 0.5833\n",
      "Iteration: 676, Train loss: 0.0092, rewards: 0.6167\n",
      "Iteration: 678, Train loss: -0.0076, rewards: 0.5333\n",
      "Iteration: 680, Train loss: 0.0381, rewards: 0.5667\n",
      "Eval:\n",
      "Hits@1: 0.4948, Hits@3: 0.5670, Hits@10: 0.6289, MRR: 0.5455\n",
      "------------------------------------------------------------\n",
      "Iteration: 682, Train loss: 0.0129, rewards: 0.4500\n",
      "Iteration: 684, Train loss: 0.0198, rewards: 0.4667\n",
      "Iteration: 686, Train loss: 0.0257, rewards: 0.4808\n",
      "Iteration: 688, Train loss: 0.0185, rewards: 0.4833\n",
      "Iteration: 690, Train loss: 0.0182, rewards: 0.5167\n",
      "Iteration: 692, Train loss: -0.0006, rewards: 0.6000\n",
      "Iteration: 694, Train loss: 0.0192, rewards: 0.6167\n",
      "Iteration: 696, Train loss: -0.0014, rewards: 0.5333\n",
      "Iteration: 698, Train loss: 0.0175, rewards: 0.5333\n",
      "Iteration: 700, Train loss: 0.0167, rewards: 0.6000\n",
      "Eval:\n",
      "Hits@1: 0.4639, Hits@3: 0.6082, Hits@10: 0.6598, MRR: 0.5422\n",
      "------------------------------------------------------------\n",
      "Iteration: 702, Train loss: 0.0136, rewards: 0.5150\n",
      "Iteration: 704, Train loss: 0.0157, rewards: 0.5167\n",
      "Iteration: 706, Train loss: 0.0215, rewards: 0.6000\n",
      "Iteration: 708, Train loss: 0.0259, rewards: 0.5333\n",
      "Iteration: 710, Train loss: 0.0141, rewards: 0.6167\n",
      "Iteration: 712, Train loss: 0.0156, rewards: 0.5500\n",
      "Iteration: 714, Train loss: 0.0065, rewards: 0.4833\n",
      "Iteration: 716, Train loss: 0.0316, rewards: 0.4833\n",
      "Iteration: 718, Train loss: -0.0039, rewards: 0.4833\n",
      "Iteration: 720, Train loss: -0.0006, rewards: 0.4833\n",
      "Eval:\n",
      "Hits@1: 0.4124, Hits@3: 0.5876, Hits@10: 0.6598, MRR: 0.5131\n",
      "------------------------------------------------------------\n",
      "Iteration: 722, Train loss: 0.0160, rewards: 0.5167\n",
      "Iteration: 724, Train loss: 0.0343, rewards: 0.6500\n",
      "Iteration: 726, Train loss: 0.0274, rewards: 0.5500\n",
      "Iteration: 728, Train loss: 0.0169, rewards: 0.5833\n",
      "Iteration: 730, Train loss: 0.0378, rewards: 0.4500\n",
      "Iteration: 732, Train loss: 0.0338, rewards: 0.5567\n",
      "Iteration: 734, Train loss: 0.0224, rewards: 0.5000\n",
      "Iteration: 736, Train loss: 0.0203, rewards: 0.4500\n",
      "Iteration: 738, Train loss: 0.0382, rewards: 0.5317\n",
      "Iteration: 740, Train loss: -0.0008, rewards: 0.6000\n",
      "Eval:\n",
      "Hits@1: 0.4433, Hits@3: 0.6082, Hits@10: 0.6804, MRR: 0.5333\n",
      "------------------------------------------------------------\n",
      "Iteration: 742, Train loss: 0.0202, rewards: 0.6333\n",
      "Iteration: 744, Train loss: -0.0124, rewards: 0.4833\n",
      "Iteration: 746, Train loss: 0.0069, rewards: 0.5333\n",
      "Iteration: 748, Train loss: -0.0141, rewards: 0.4167\n",
      "Iteration: 750, Train loss: -0.0031, rewards: 0.5333\n",
      "Iteration: 752, Train loss: -0.0205, rewards: 0.4392\n",
      "Iteration: 754, Train loss: 0.0107, rewards: 0.5000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 756, Train loss: -0.0039, rewards: 0.6333\n",
      "Iteration: 758, Train loss: 0.0024, rewards: 0.4833\n",
      "Iteration: 760, Train loss: 0.0303, rewards: 0.5000\n",
      "Eval:\n",
      "Hits@1: 0.4021, Hits@3: 0.5567, Hits@10: 0.6392, MRR: 0.4863\n",
      "------------------------------------------------------------\n",
      "Iteration: 762, Train loss: 0.0274, rewards: 0.4167\n",
      "Iteration: 764, Train loss: -0.0055, rewards: 0.4833\n",
      "Iteration: 766, Train loss: 0.0147, rewards: 0.5000\n",
      "Iteration: 768, Train loss: -0.0011, rewards: 0.4667\n",
      "Iteration: 770, Train loss: 0.0038, rewards: 0.6500\n",
      "Iteration: 772, Train loss: 0.0222, rewards: 0.6333\n",
      "Iteration: 774, Train loss: 0.0064, rewards: 0.5500\n",
      "Iteration: 776, Train loss: 0.0294, rewards: 0.5000\n",
      "Iteration: 778, Train loss: -0.0041, rewards: 0.4167\n",
      "Iteration: 780, Train loss: 0.0177, rewards: 0.4833\n",
      "Eval:\n",
      "Hits@1: 0.4021, Hits@3: 0.6186, Hits@10: 0.6701, MRR: 0.5122\n",
      "------------------------------------------------------------\n",
      "Iteration: 782, Train loss: 0.0096, rewards: 0.3667\n",
      "Iteration: 784, Train loss: 0.0063, rewards: 0.3833\n",
      "Iteration: 786, Train loss: 0.0172, rewards: 0.4000\n",
      "Iteration: 788, Train loss: -0.0141, rewards: 0.4833\n",
      "Iteration: 790, Train loss: 0.0134, rewards: 0.4333\n",
      "Iteration: 792, Train loss: 0.0049, rewards: 0.3167\n",
      "Iteration: 794, Train loss: 0.0437, rewards: 0.4000\n",
      "Iteration: 796, Train loss: 0.0181, rewards: 0.2833\n",
      "Iteration: 798, Train loss: 0.0002, rewards: 0.4167\n",
      "Iteration: 800, Train loss: 0.0203, rewards: 0.4333\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.4948, Hits@10: 0.6701, MRR: 0.4383\n",
      "------------------------------------------------------------\n",
      "Iteration: 802, Train loss: 0.0056, rewards: 0.3500\n",
      "Iteration: 804, Train loss: 0.0102, rewards: 0.3333\n",
      "Iteration: 806, Train loss: 0.0174, rewards: 0.4167\n",
      "Iteration: 808, Train loss: -0.0014, rewards: 0.4333\n",
      "Iteration: 810, Train loss: 0.0079, rewards: 0.4333\n",
      "Iteration: 812, Train loss: 0.0010, rewards: 0.4833\n",
      "Iteration: 814, Train loss: -0.0259, rewards: 0.4500\n",
      "Iteration: 816, Train loss: -0.0024, rewards: 0.4333\n",
      "Iteration: 818, Train loss: 0.0204, rewards: 0.4833\n",
      "Iteration: 820, Train loss: 0.0073, rewards: 0.4333\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5155, Hits@10: 0.6186, MRR: 0.4410\n",
      "------------------------------------------------------------\n",
      "Iteration: 822, Train loss: 0.0022, rewards: 0.4333\n",
      "Iteration: 824, Train loss: 0.0390, rewards: 0.3833\n",
      "Iteration: 826, Train loss: 0.0186, rewards: 0.4000\n",
      "Iteration: 828, Train loss: 0.0455, rewards: 0.4500\n",
      "Iteration: 830, Train loss: -0.0024, rewards: 0.5000\n",
      "Iteration: 832, Train loss: -0.0014, rewards: 0.2667\n",
      "Iteration: 834, Train loss: 0.0274, rewards: 0.4500\n",
      "Iteration: 836, Train loss: -0.0138, rewards: 0.4167\n",
      "Iteration: 838, Train loss: 0.0228, rewards: 0.4500\n",
      "Iteration: 840, Train loss: 0.0107, rewards: 0.4667\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5361, Hits@10: 0.6186, MRR: 0.4448\n",
      "------------------------------------------------------------\n",
      "Iteration: 842, Train loss: 0.0067, rewards: 0.3000\n",
      "Iteration: 844, Train loss: 0.0158, rewards: 0.4500\n",
      "Iteration: 846, Train loss: -0.0220, rewards: 0.4000\n",
      "Iteration: 848, Train loss: 0.0170, rewards: 0.4500\n",
      "Iteration: 850, Train loss: 0.0149, rewards: 0.3667\n",
      "Iteration: 852, Train loss: -0.0041, rewards: 0.3500\n",
      "Iteration: 854, Train loss: 0.0002, rewards: 0.3833\n",
      "Iteration: 856, Train loss: 0.0065, rewards: 0.5000\n",
      "Iteration: 858, Train loss: 0.0017, rewards: 0.3500\n",
      "Iteration: 860, Train loss: 0.0119, rewards: 0.5000\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 862, Train loss: -0.0062, rewards: 0.3000\n",
      "Iteration: 864, Train loss: 0.0264, rewards: 0.4167\n",
      "Iteration: 866, Train loss: 0.0449, rewards: 0.3500\n",
      "Iteration: 868, Train loss: 0.0185, rewards: 0.4333\n",
      "Iteration: 870, Train loss: -0.0038, rewards: 0.4667\n",
      "Iteration: 872, Train loss: 0.0070, rewards: 0.4667\n",
      "Iteration: 874, Train loss: 0.0077, rewards: 0.4333\n",
      "Iteration: 876, Train loss: 0.0423, rewards: 0.4500\n",
      "Iteration: 878, Train loss: -0.0005, rewards: 0.4000\n",
      "Iteration: 880, Train loss: 0.0030, rewards: 0.4333\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 882, Train loss: 0.0102, rewards: 0.4167\n",
      "Iteration: 884, Train loss: 0.0112, rewards: 0.3667\n",
      "Iteration: 886, Train loss: 0.0076, rewards: 0.3833\n",
      "Iteration: 888, Train loss: 0.0084, rewards: 0.4833\n",
      "Iteration: 890, Train loss: 0.0328, rewards: 0.4167\n",
      "Iteration: 892, Train loss: -0.0113, rewards: 0.3833\n",
      "Iteration: 894, Train loss: -0.0033, rewards: 0.4167\n",
      "Iteration: 896, Train loss: -0.0032, rewards: 0.3667\n",
      "Iteration: 898, Train loss: 0.0090, rewards: 0.3333\n",
      "Iteration: 900, Train loss: 0.0006, rewards: 0.4667\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 902, Train loss: 0.0138, rewards: 0.3833\n",
      "Iteration: 904, Train loss: 0.0124, rewards: 0.4333\n",
      "Iteration: 906, Train loss: 0.0154, rewards: 0.3167\n",
      "Iteration: 908, Train loss: -0.0119, rewards: 0.3833\n",
      "Iteration: 910, Train loss: 0.0180, rewards: 0.4167\n",
      "Iteration: 912, Train loss: 0.0226, rewards: 0.3667\n",
      "Iteration: 914, Train loss: 0.0063, rewards: 0.3333\n",
      "Iteration: 916, Train loss: 0.0169, rewards: 0.3667\n",
      "Iteration: 918, Train loss: 0.0092, rewards: 0.4500\n",
      "Iteration: 920, Train loss: 0.0095, rewards: 0.4000\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 922, Train loss: 0.0066, rewards: 0.3500\n",
      "Iteration: 924, Train loss: 0.0147, rewards: 0.4167\n",
      "Iteration: 926, Train loss: 0.0171, rewards: 0.4000\n",
      "Iteration: 928, Train loss: 0.0163, rewards: 0.3667\n",
      "Iteration: 930, Train loss: 0.0067, rewards: 0.3500\n",
      "Iteration: 932, Train loss: 0.0148, rewards: 0.4500\n",
      "Iteration: 934, Train loss: -0.0092, rewards: 0.5000\n",
      "Iteration: 936, Train loss: -0.0011, rewards: 0.3667\n",
      "Iteration: 938, Train loss: 0.0029, rewards: 0.4667\n",
      "Iteration: 940, Train loss: 0.0009, rewards: 0.4167\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 942, Train loss: -0.0023, rewards: 0.3333\n",
      "Iteration: 944, Train loss: 0.0058, rewards: 0.4167\n",
      "Iteration: 946, Train loss: 0.0268, rewards: 0.5333\n",
      "Iteration: 948, Train loss: 0.0039, rewards: 0.4333\n",
      "Iteration: 950, Train loss: -0.0105, rewards: 0.4333\n",
      "Iteration: 952, Train loss: 0.0217, rewards: 0.5000\n",
      "Iteration: 954, Train loss: -0.0215, rewards: 0.3667\n",
      "Iteration: 956, Train loss: 0.0393, rewards: 0.5333\n",
      "Iteration: 958, Train loss: -0.0107, rewards: 0.3500\n",
      "Iteration: 960, Train loss: -0.0034, rewards: 0.4833\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 962, Train loss: 0.0108, rewards: 0.4000\n",
      "Iteration: 964, Train loss: 0.0267, rewards: 0.4333\n",
      "Iteration: 966, Train loss: -0.0044, rewards: 0.4333\n",
      "Iteration: 968, Train loss: 0.0197, rewards: 0.3667\n",
      "Iteration: 970, Train loss: 0.0252, rewards: 0.4500\n",
      "Iteration: 972, Train loss: 0.0427, rewards: 0.4000\n",
      "Iteration: 974, Train loss: 0.0319, rewards: 0.4333\n",
      "Iteration: 976, Train loss: 0.0198, rewards: 0.5000\n",
      "Iteration: 978, Train loss: -0.0056, rewards: 0.3667\n",
      "Iteration: 980, Train loss: 0.0274, rewards: 0.4167\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "Iteration: 982, Train loss: 0.0148, rewards: 0.4333\n",
      "Iteration: 984, Train loss: 0.0304, rewards: 0.4333\n",
      "Iteration: 986, Train loss: -0.0374, rewards: 0.4000\n",
      "Iteration: 988, Train loss: 0.0046, rewards: 0.4833\n",
      "Iteration: 990, Train loss: -0.0125, rewards: 0.4000\n",
      "Iteration: 992, Train loss: 0.0143, rewards: 0.3833\n",
      "Iteration: 994, Train loss: 0.0240, rewards: 0.4500\n",
      "Iteration: 996, Train loss: 0.0371, rewards: 0.3667\n",
      "Iteration: 998, Train loss: 0.0010, rewards: 0.4667\n",
      "Iteration: 1000, Train loss: -0.0105, rewards: 0.4000\n",
      "Eval:\n",
      "Hits@1: 0.3299, Hits@3: 0.5258, Hits@10: 0.6186, MRR: 0.4438\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.2321, Hits@3: 0.4732, Hits@10: 0.7589, MRR: 0.3976\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.782312925170068 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:31:19,173]\u001b[0m Trial 0 finished with value: 0.782312925170068 and parameters: {'lr': 0.004179118013024347, 'bs': 30, 'b': 0.09117422764572974, 'l': 0.08052106610329096, 'ee': 20}. Best is trial 0 with value: 0.782312925170068.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 1, Train loss: -0.3970, rewards: 0.4222\n",
      "Iteration: 2, Train loss: 0.0211, rewards: 0.1889\n",
      "Iteration: 3, Train loss: -0.0072, rewards: 0.2037\n",
      "Iteration: 4, Train loss: -0.0069, rewards: 0.3704\n",
      "Iteration: 5, Train loss: -0.0022, rewards: 0.3889\n",
      "Iteration: 6, Train loss: 0.0032, rewards: 0.2843\n",
      "Iteration: 7, Train loss: -0.0012, rewards: 0.0556\n",
      "Iteration: 8, Train loss: -0.0015, rewards: 0.0000\n",
      "Iteration: 9, Train loss: -0.0018, rewards: 0.0000\n",
      "Iteration: 10, Train loss: -0.0020, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0013\n",
      "------------------------------------------------------------\n",
      "Iteration: 11, Train loss: -0.0023, rewards: 0.0000\n",
      "Iteration: 12, Train loss: -0.0020, rewards: 0.0000\n",
      "Iteration: 13, Train loss: -0.0016, rewards: 0.0000\n",
      "Iteration: 14, Train loss: -0.0016, rewards: 0.0000\n",
      "Iteration: 15, Train loss: -0.0006, rewards: 0.0000\n",
      "Iteration: 16, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 17, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 18, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 19, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 20, Train loss: -0.0009, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0000\n",
      "------------------------------------------------------------\n",
      "Iteration: 21, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 22, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 23, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 24, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 25, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 26, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 27, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 28, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 29, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 30, Train loss: -0.0003, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0000\n",
      "------------------------------------------------------------\n",
      "Iteration: 31, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 32, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 33, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 34, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 35, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 36, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 37, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 38, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 39, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 40, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0000\n",
      "------------------------------------------------------------\n",
      "Iteration: 41, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 42, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 43, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 44, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 45, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 46, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 47, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 48, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 49, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 50, Train loss: -0.0006, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0006\n",
      "------------------------------------------------------------\n",
      "Iteration: 51, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 52, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 53, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 54, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 55, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 56, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 57, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 58, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 59, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 60, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0031\n",
      "------------------------------------------------------------\n",
      "Iteration: 61, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 62, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 63, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 64, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 65, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 66, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 67, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 68, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 69, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 70, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0035\n",
      "------------------------------------------------------------\n",
      "Iteration: 71, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 72, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 73, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 74, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 75, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 76, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 77, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 78, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 79, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 80, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0027\n",
      "------------------------------------------------------------\n",
      "Iteration: 81, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 82, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 83, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 84, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 85, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 86, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 87, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 88, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 89, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 90, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 91, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 92, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 93, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 94, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 95, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 96, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 97, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 98, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 99, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 100, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 101, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 102, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 103, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 104, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 105, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 106, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 107, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 108, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 109, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 110, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 111, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 112, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 113, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 114, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 115, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 116, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 117, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 118, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 119, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 120, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 121, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 122, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 123, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 124, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 125, Train loss: -0.0000, rewards: 0.0000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 126, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 127, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 128, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 129, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 130, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 131, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 132, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 133, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 134, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 135, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 136, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 137, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 138, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 139, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 140, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 141, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 142, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 143, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 144, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 145, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 146, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 147, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 148, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 149, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 150, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 151, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 152, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 153, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 154, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 155, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 156, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 157, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 158, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 159, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 160, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 161, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 162, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 163, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 164, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 165, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 166, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 167, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 168, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 169, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 170, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 171, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 172, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 173, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 174, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 175, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 176, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 177, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 178, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 179, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 180, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 181, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 182, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 183, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 184, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 185, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 186, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 187, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 188, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 189, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 190, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 191, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 192, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 193, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 194, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 195, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 196, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 197, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 198, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 199, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 200, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 201, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 202, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 203, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 204, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 205, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 206, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 207, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 208, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 209, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 210, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 211, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 212, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 213, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 214, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 215, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 216, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 217, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 218, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 219, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 220, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 221, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 222, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 223, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 224, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 225, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 226, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 227, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 228, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 229, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 230, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 231, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 232, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 233, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 234, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 235, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 236, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 237, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 238, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 239, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 240, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 241, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 242, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 243, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 244, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 245, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 246, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 247, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 248, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 249, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 250, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 251, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 252, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 253, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 254, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 255, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 256, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 257, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 258, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 259, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 260, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 261, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 262, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 263, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 264, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 265, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 266, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 267, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 268, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 269, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 270, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 271, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 272, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 273, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 274, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 275, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 276, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 277, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 278, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 279, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 280, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 281, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 282, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 283, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 284, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 285, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 286, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 287, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 288, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 289, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 290, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 291, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 292, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 293, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 294, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 295, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 296, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 297, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 298, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 299, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 300, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 301, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 302, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 303, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 304, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 305, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 306, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 307, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 308, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 309, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 310, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 311, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 312, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 313, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 314, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 315, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 316, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 317, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 318, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 319, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 320, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 321, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 322, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 323, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 324, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 325, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 326, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 327, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 328, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 329, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 330, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 331, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 332, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 333, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 334, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 335, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 336, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 337, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 338, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 339, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 340, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 341, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 342, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 343, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 344, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 345, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 346, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 347, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 348, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 349, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 350, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 351, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 352, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 353, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 354, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 355, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 356, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 357, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 358, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 359, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 360, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 361, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 362, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 363, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 364, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 365, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 366, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 367, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 368, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 369, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 370, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 371, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 372, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 373, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 374, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 375, Train loss: -0.0000, rewards: 0.0000\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 376, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 377, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 378, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 379, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 380, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 381, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 382, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 383, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 384, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 385, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 386, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 387, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 388, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 389, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 390, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 391, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 392, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 393, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 394, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 395, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 396, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 397, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 398, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 399, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 400, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 401, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 402, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 403, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 404, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 405, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 406, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 407, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 408, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 409, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 410, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 411, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 412, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 413, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 414, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 415, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 416, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 417, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 418, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 419, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 420, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 421, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 422, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 423, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 424, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 425, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 426, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 427, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 428, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 429, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 430, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 431, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 432, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 433, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 434, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 435, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 436, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 437, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 438, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 439, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 440, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 441, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 442, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 443, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 444, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 445, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 446, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 447, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 448, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 449, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 450, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 451, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 452, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 453, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 454, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 455, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 456, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 457, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 458, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 459, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 460, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 461, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 462, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 463, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 464, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 465, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 466, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 467, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 468, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 469, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 470, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 471, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 472, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 473, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 474, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 475, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 476, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 477, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 478, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 479, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 480, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 481, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 482, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 483, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 484, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 485, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 486, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 487, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 488, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 489, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 490, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n",
      "------------------------------------------------------------\n",
      "Iteration: 491, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 492, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 493, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 494, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 495, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 496, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 497, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 498, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 499, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 500, Train loss: -0.0000, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0103, MRR: 0.0021\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 501, Train loss: -0.0000, rewards: 0.0000\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.0000, Hits@3: 0.0089, Hits@10: 0.0268, MRR: 0.0075\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.5346513605442177 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 21:47:20,259]\u001b[0m Trial 1 finished with value: 0.5346513605442177 and parameters: {'lr': 0.0046128743803208125, 'bs': 54, 'b': 0.06120348336555298, 'l': 0.17442519261654532, 'ee': 10}. Best is trial 0 with value: 0.782312925170068.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -1.0981, rewards: 0.0876\n",
      "Iteration: 20, Train loss: -1.3957, rewards: 0.1769\n",
      "Iteration: 30, Train loss: -1.4607, rewards: 0.1905\n",
      "Iteration: 40, Train loss: -1.5178, rewards: 0.2193\n",
      "Iteration: 50, Train loss: -1.4860, rewards: 0.2983\n",
      "Iteration: 60, Train loss: -1.5705, rewards: 0.2693\n",
      "Iteration: 70, Train loss: -1.5420, rewards: 0.2993\n",
      "Iteration: 80, Train loss: -1.4740, rewards: 0.2936\n",
      "Iteration: 90, Train loss: -1.5681, rewards: 0.3169\n",
      "Iteration: 100, Train loss: -1.4643, rewards: 0.2814\n",
      "Eval:\n",
      "Hits@1: 0.5567, Hits@3: 0.7216, Hits@10: 0.7938, MRR: 0.6452\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -1.4674, rewards: 0.3188\n",
      "Iteration: 120, Train loss: -1.4521, rewards: 0.3126\n",
      "Iteration: 130, Train loss: -1.4679, rewards: 0.3414\n",
      "Iteration: 140, Train loss: -1.5418, rewards: 0.2814\n",
      "Iteration: 150, Train loss: -1.3846, rewards: 0.2981\n",
      "Iteration: 160, Train loss: -1.4357, rewards: 0.3357\n",
      "Iteration: 170, Train loss: -1.5245, rewards: 0.3207\n",
      "Iteration: 180, Train loss: -1.4483, rewards: 0.2860\n",
      "Iteration: 190, Train loss: -1.4356, rewards: 0.2867\n",
      "Iteration: 200, Train loss: -1.4449, rewards: 0.3252\n",
      "Eval:\n",
      "Hits@1: 0.5773, Hits@3: 0.7423, Hits@10: 0.8454, MRR: 0.6701\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -1.3859, rewards: 0.3279\n",
      "Iteration: 220, Train loss: -1.3904, rewards: 0.4105\n",
      "Iteration: 230, Train loss: -1.4886, rewards: 0.3476\n",
      "Iteration: 240, Train loss: -1.4077, rewards: 0.3543\n",
      "Iteration: 250, Train loss: -1.4655, rewards: 0.3114\n",
      "Iteration: 260, Train loss: -1.4260, rewards: 0.3369\n",
      "Iteration: 270, Train loss: -1.4432, rewards: 0.3279\n",
      "Iteration: 280, Train loss: -1.4854, rewards: 0.3702\n",
      "Iteration: 290, Train loss: -1.4518, rewards: 0.3121\n",
      "Iteration: 300, Train loss: -1.4390, rewards: 0.3393\n",
      "Eval:\n",
      "Hits@1: 0.6495, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7130\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -1.4563, rewards: 0.3157\n",
      "Iteration: 320, Train loss: -1.4927, rewards: 0.3562\n",
      "Iteration: 330, Train loss: -1.4556, rewards: 0.3583\n",
      "Iteration: 340, Train loss: -1.5685, rewards: 0.3771\n",
      "Iteration: 350, Train loss: -1.5773, rewards: 0.3250\n",
      "Iteration: 360, Train loss: -1.4656, rewards: 0.3195\n",
      "Iteration: 370, Train loss: -1.3993, rewards: 0.3740\n",
      "Iteration: 380, Train loss: -1.5001, rewards: 0.3826\n",
      "Iteration: 390, Train loss: -1.3875, rewards: 0.3021\n",
      "Iteration: 400, Train loss: -1.4902, rewards: 0.3398\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7629, Hits@10: 0.8351, MRR: 0.7291\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -1.4676, rewards: 0.3505\n",
      "Iteration: 420, Train loss: -1.3997, rewards: 0.3240\n",
      "Iteration: 430, Train loss: -1.4409, rewards: 0.3250\n",
      "Iteration: 440, Train loss: -1.3811, rewards: 0.3271\n",
      "Iteration: 450, Train loss: -1.4924, rewards: 0.3900\n",
      "Iteration: 460, Train loss: -1.4775, rewards: 0.3552\n",
      "Iteration: 470, Train loss: -1.4008, rewards: 0.3540\n",
      "Iteration: 480, Train loss: -1.4581, rewards: 0.3650\n",
      "Iteration: 490, Train loss: -1.4045, rewards: 0.3348\n",
      "Iteration: 500, Train loss: -1.4544, rewards: 0.3907\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7219\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -1.5394, rewards: 0.3886\n",
      "Iteration: 520, Train loss: -1.5478, rewards: 0.3402\n",
      "Iteration: 530, Train loss: -1.4220, rewards: 0.3807\n",
      "Iteration: 540, Train loss: -1.3804, rewards: 0.3688\n",
      "Iteration: 550, Train loss: -1.4314, rewards: 0.3914\n",
      "Iteration: 560, Train loss: -1.5124, rewards: 0.3643\n",
      "Iteration: 570, Train loss: -1.4447, rewards: 0.3812\n",
      "Iteration: 580, Train loss: -1.5113, rewards: 0.3321\n",
      "Iteration: 590, Train loss: -1.3526, rewards: 0.3324\n",
      "Iteration: 600, Train loss: -1.4646, rewards: 0.3519\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7835, Hits@10: 0.8247, MRR: 0.7321\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -1.4457, rewards: 0.3767\n",
      "Iteration: 620, Train loss: -1.4244, rewards: 0.3614\n",
      "Iteration: 630, Train loss: -1.4326, rewards: 0.3600\n",
      "Iteration: 640, Train loss: -1.5600, rewards: 0.3474\n",
      "Iteration: 650, Train loss: -1.5336, rewards: 0.3629\n",
      "Iteration: 660, Train loss: -1.4808, rewards: 0.3826\n",
      "Iteration: 670, Train loss: -1.5019, rewards: 0.3369\n",
      "Iteration: 680, Train loss: -1.4470, rewards: 0.3390\n",
      "Iteration: 690, Train loss: -1.3210, rewards: 0.3719\n",
      "Iteration: 700, Train loss: -1.4158, rewards: 0.3819\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7311\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -1.5448, rewards: 0.3624\n",
      "Iteration: 720, Train loss: -1.5229, rewards: 0.3431\n",
      "Iteration: 730, Train loss: -1.4360, rewards: 0.3455\n",
      "Iteration: 740, Train loss: -1.3883, rewards: 0.4029\n",
      "Iteration: 750, Train loss: -1.4250, rewards: 0.3529\n",
      "Iteration: 760, Train loss: -1.2471, rewards: 0.3426\n",
      "Iteration: 770, Train loss: -1.4660, rewards: 0.3483\n",
      "Iteration: 780, Train loss: -1.4401, rewards: 0.3840\n",
      "Iteration: 790, Train loss: -1.5128, rewards: 0.3367\n",
      "Iteration: 800, Train loss: -1.5350, rewards: 0.3812\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7291\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -1.4160, rewards: 0.3498\n",
      "Iteration: 820, Train loss: -1.3795, rewards: 0.3583\n",
      "Iteration: 830, Train loss: -1.3971, rewards: 0.3736\n",
      "Iteration: 840, Train loss: -1.4708, rewards: 0.3605\n",
      "Iteration: 850, Train loss: -1.4802, rewards: 0.3545\n",
      "Iteration: 860, Train loss: -1.4574, rewards: 0.3636\n",
      "Iteration: 870, Train loss: -1.3415, rewards: 0.3781\n",
      "Iteration: 880, Train loss: -1.4602, rewards: 0.3552\n",
      "Iteration: 890, Train loss: -1.5313, rewards: 0.3929\n",
      "Iteration: 900, Train loss: -1.4476, rewards: 0.3679\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7732, Hits@10: 0.8041, MRR: 0.7214\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -1.4861, rewards: 0.3762\n",
      "Iteration: 920, Train loss: -1.4282, rewards: 0.3717\n",
      "Iteration: 930, Train loss: -1.5217, rewards: 0.3424\n",
      "Iteration: 940, Train loss: -1.5539, rewards: 0.3307\n",
      "Iteration: 950, Train loss: -1.4459, rewards: 0.3836\n",
      "Iteration: 960, Train loss: -1.4048, rewards: 0.3543\n",
      "Iteration: 970, Train loss: -1.4445, rewards: 0.3607\n",
      "Iteration: 980, Train loss: -1.4351, rewards: 0.3990\n",
      "Iteration: 990, Train loss: -1.4228, rewards: 0.3588\n",
      "Iteration: 1000, Train loss: -1.4843, rewards: 0.3762\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7341\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -1.4411, rewards: 0.3840\n",
      "Iteration: 1020, Train loss: -1.3232, rewards: 0.3688\n",
      "Iteration: 1030, Train loss: -1.4805, rewards: 0.4021\n",
      "Iteration: 1040, Train loss: -1.5287, rewards: 0.3595\n",
      "Iteration: 1050, Train loss: -1.5033, rewards: 0.3621\n",
      "Iteration: 1060, Train loss: -1.4072, rewards: 0.3871\n",
      "Iteration: 1070, Train loss: -1.5600, rewards: 0.3895\n",
      "Iteration: 1080, Train loss: -1.5071, rewards: 0.3869\n",
      "Iteration: 1090, Train loss: -1.5486, rewards: 0.3700\n",
      "Iteration: 1100, Train loss: -1.4641, rewards: 0.3398\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.7938, MRR: 0.7315\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -1.5515, rewards: 0.3943\n",
      "Iteration: 1120, Train loss: -1.4591, rewards: 0.3631\n",
      "Iteration: 1130, Train loss: -1.4927, rewards: 0.3557\n",
      "Iteration: 1140, Train loss: -1.4495, rewards: 0.3683\n",
      "Iteration: 1150, Train loss: -1.4947, rewards: 0.3629\n",
      "Iteration: 1160, Train loss: -1.4922, rewards: 0.4050\n",
      "Iteration: 1170, Train loss: -1.4447, rewards: 0.3455\n",
      "Iteration: 1180, Train loss: -1.4946, rewards: 0.3686\n",
      "Iteration: 1190, Train loss: -1.4029, rewards: 0.3786\n",
      "Iteration: 1200, Train loss: -1.4924, rewards: 0.3429\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7333\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -1.4530, rewards: 0.3379\n",
      "Iteration: 1220, Train loss: -1.4890, rewards: 0.3907\n",
      "Iteration: 1230, Train loss: -1.5596, rewards: 0.3683\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -1.5009, rewards: 0.3874\n",
      "Iteration: 1250, Train loss: -1.5304, rewards: 0.3855\n",
      "Iteration: 1260, Train loss: -1.3183, rewards: 0.3883\n",
      "Iteration: 1270, Train loss: -1.5782, rewards: 0.3640\n",
      "Iteration: 1280, Train loss: -1.4293, rewards: 0.3495\n",
      "Iteration: 1290, Train loss: -1.3697, rewards: 0.3505\n",
      "Iteration: 1300, Train loss: -1.4444, rewards: 0.3448\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7412\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -1.4077, rewards: 0.3721\n",
      "Iteration: 1320, Train loss: -1.4778, rewards: 0.3898\n",
      "Iteration: 1330, Train loss: -1.4341, rewards: 0.3721\n",
      "Iteration: 1340, Train loss: -1.4249, rewards: 0.3374\n",
      "Iteration: 1350, Train loss: -1.5565, rewards: 0.3955\n",
      "Iteration: 1360, Train loss: -1.5317, rewards: 0.3302\n",
      "Iteration: 1370, Train loss: -1.3966, rewards: 0.3752\n",
      "Iteration: 1380, Train loss: -1.6025, rewards: 0.3752\n",
      "Iteration: 1390, Train loss: -1.4175, rewards: 0.3379\n",
      "Iteration: 1400, Train loss: -1.4783, rewards: 0.4026\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7526, Hits@10: 0.8144, MRR: 0.7158\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -1.4022, rewards: 0.3540\n",
      "Iteration: 1420, Train loss: -1.4707, rewards: 0.3574\n",
      "Iteration: 1430, Train loss: -1.4790, rewards: 0.3848\n",
      "Iteration: 1440, Train loss: -1.5785, rewards: 0.3505\n",
      "Iteration: 1450, Train loss: -1.5059, rewards: 0.4214\n",
      "Iteration: 1460, Train loss: -1.5291, rewards: 0.3617\n",
      "Iteration: 1470, Train loss: -1.5179, rewards: 0.3821\n",
      "Iteration: 1480, Train loss: -1.4890, rewards: 0.3883\n",
      "Iteration: 1490, Train loss: -1.4734, rewards: 0.3962\n",
      "Iteration: 1500, Train loss: -1.4894, rewards: 0.3912\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7298\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -1.4216, rewards: 0.3586\n",
      "Iteration: 1520, Train loss: -1.4958, rewards: 0.3429\n",
      "Iteration: 1530, Train loss: -1.4582, rewards: 0.3624\n",
      "Iteration: 1540, Train loss: -1.4489, rewards: 0.3345\n",
      "Iteration: 1550, Train loss: -1.4095, rewards: 0.4005\n",
      "Iteration: 1560, Train loss: -1.5055, rewards: 0.3476\n",
      "Iteration: 1570, Train loss: -1.4530, rewards: 0.3719\n",
      "Iteration: 1580, Train loss: -1.4096, rewards: 0.3581\n",
      "Iteration: 1590, Train loss: -1.4685, rewards: 0.3605\n",
      "Iteration: 1600, Train loss: -1.4643, rewards: 0.3986\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7320, Hits@10: 0.8144, MRR: 0.7151\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -1.4603, rewards: 0.3562\n",
      "Iteration: 1620, Train loss: -1.5895, rewards: 0.3662\n",
      "Iteration: 1630, Train loss: -1.4689, rewards: 0.3321\n",
      "Iteration: 1640, Train loss: -1.4595, rewards: 0.3645\n",
      "Iteration: 1650, Train loss: -1.4452, rewards: 0.4119\n",
      "Iteration: 1660, Train loss: -1.4591, rewards: 0.3576\n",
      "Iteration: 1670, Train loss: -1.4796, rewards: 0.3971\n",
      "Iteration: 1680, Train loss: -1.5085, rewards: 0.3683\n",
      "Iteration: 1690, Train loss: -1.4230, rewards: 0.3726\n",
      "Iteration: 1700, Train loss: -1.4135, rewards: 0.3679\n",
      "Eval:\n",
      "Hits@1: 0.6495, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7098\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -1.5007, rewards: 0.3852\n",
      "Iteration: 1720, Train loss: -1.4248, rewards: 0.3607\n",
      "Iteration: 1730, Train loss: -1.4964, rewards: 0.3650\n",
      "Iteration: 1740, Train loss: -1.3837, rewards: 0.3600\n",
      "Iteration: 1750, Train loss: -1.4953, rewards: 0.3536\n",
      "Iteration: 1760, Train loss: -1.5235, rewards: 0.3831\n",
      "Iteration: 1770, Train loss: -1.4805, rewards: 0.4188\n",
      "Iteration: 1780, Train loss: -1.4041, rewards: 0.3479\n",
      "Iteration: 1790, Train loss: -1.4834, rewards: 0.4276\n",
      "Iteration: 1800, Train loss: -1.5447, rewards: 0.3536\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7835, Hits@10: 0.8351, MRR: 0.7291\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -1.4838, rewards: 0.4040\n",
      "Iteration: 1820, Train loss: -1.5094, rewards: 0.3533\n",
      "Iteration: 1830, Train loss: -1.4911, rewards: 0.3669\n",
      "Iteration: 1840, Train loss: -1.4952, rewards: 0.3490\n",
      "Iteration: 1850, Train loss: -1.4095, rewards: 0.4071\n",
      "Iteration: 1860, Train loss: -1.4168, rewards: 0.3550\n",
      "Iteration: 1870, Train loss: -1.4715, rewards: 0.3531\n",
      "Iteration: 1880, Train loss: -1.3296, rewards: 0.3707\n",
      "Iteration: 1890, Train loss: -1.4576, rewards: 0.3729\n",
      "Iteration: 1900, Train loss: -1.4735, rewards: 0.3545\n",
      "Eval:\n",
      "Hits@1: 0.6495, Hits@3: 0.7320, Hits@10: 0.8144, MRR: 0.7007\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -1.4183, rewards: 0.4043\n",
      "Iteration: 1920, Train loss: -1.4373, rewards: 0.3152\n",
      "Iteration: 1930, Train loss: -1.3097, rewards: 0.4264\n",
      "Iteration: 1940, Train loss: -1.5269, rewards: 0.3348\n",
      "Iteration: 1950, Train loss: -1.3534, rewards: 0.4176\n",
      "Iteration: 1960, Train loss: -1.5302, rewards: 0.3407\n",
      "Iteration: 1970, Train loss: -1.4633, rewards: 0.3671\n",
      "Iteration: 1980, Train loss: -1.4618, rewards: 0.3731\n",
      "Iteration: 1990, Train loss: -1.3744, rewards: 0.3605\n",
      "Iteration: 2000, Train loss: -1.4602, rewards: 0.3555\n",
      "Eval:\n",
      "Hits@1: 0.6598, Hits@3: 0.7423, Hits@10: 0.8144, MRR: 0.7061\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.4554, Hits@3: 0.7054, Hits@10: 0.8750, MRR: 0.6115\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.7674319727891156 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 22:15:04,911]\u001b[0m Trial 2 finished with value: 0.7674319727891156 and parameters: {'lr': 0.0035805978976039717, 'bs': 21, 'b': 0.4687353054080137, 'l': 0.3684439802822461, 'ee': 100}. Best is trial 0 with value: 0.782312925170068.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 1, Train loss: -1.0445, rewards: 0.3643\n",
      "Iteration: 2, Train loss: -0.7907, rewards: 0.0039\n",
      "Iteration: 3, Train loss: -1.0652, rewards: 0.0097\n",
      "Iteration: 4, Train loss: -1.1423, rewards: 0.0987\n",
      "Iteration: 5, Train loss: -1.0733, rewards: 0.0221\n",
      "Iteration: 6, Train loss: -1.0711, rewards: 0.0435\n",
      "Iteration: 7, Train loss: -1.3849, rewards: 0.1091\n",
      "Iteration: 8, Train loss: -1.4317, rewards: 0.1617\n",
      "Iteration: 9, Train loss: -1.3285, rewards: 0.1747\n",
      "Iteration: 10, Train loss: -1.2980, rewards: 0.1273\n",
      "Eval:\n",
      "Hits@1: 0.3608, Hits@3: 0.5258, Hits@10: 0.7526, MRR: 0.4805\n",
      "------------------------------------------------------------\n",
      "Iteration: 11, Train loss: -1.3412, rewards: 0.0929\n",
      "Iteration: 12, Train loss: -1.3032, rewards: 0.1149\n",
      "Iteration: 13, Train loss: -1.4920, rewards: 0.1981\n",
      "Iteration: 14, Train loss: -1.4736, rewards: 0.2149\n",
      "Iteration: 15, Train loss: -1.2186, rewards: 0.2052\n",
      "Iteration: 16, Train loss: -1.4978, rewards: 0.2169\n",
      "Iteration: 17, Train loss: -1.4881, rewards: 0.3383\n",
      "Iteration: 18, Train loss: -1.5630, rewards: 0.2097\n",
      "Iteration: 19, Train loss: -1.4168, rewards: 0.1812\n",
      "Iteration: 20, Train loss: -1.3794, rewards: 0.2532\n",
      "Eval:\n",
      "Hits@1: 0.4227, Hits@3: 0.6495, Hits@10: 0.7732, MRR: 0.5371\n",
      "------------------------------------------------------------\n",
      "Iteration: 21, Train loss: -1.4608, rewards: 0.2890\n",
      "Iteration: 22, Train loss: -1.3745, rewards: 0.2487\n",
      "Iteration: 23, Train loss: -1.4697, rewards: 0.2370\n",
      "Iteration: 24, Train loss: -1.6284, rewards: 0.2162\n",
      "Iteration: 25, Train loss: -1.5538, rewards: 0.1838\n",
      "Iteration: 26, Train loss: -1.2641, rewards: 0.1896\n",
      "Iteration: 27, Train loss: -1.4373, rewards: 0.3325\n",
      "Iteration: 28, Train loss: -1.3972, rewards: 0.3695\n",
      "Iteration: 29, Train loss: -1.4373, rewards: 0.2461\n",
      "Iteration: 30, Train loss: -1.3064, rewards: 0.2552\n",
      "Eval:\n",
      "Hits@1: 0.5052, Hits@3: 0.7010, Hits@10: 0.8144, MRR: 0.6087\n",
      "------------------------------------------------------------\n",
      "Iteration: 31, Train loss: -1.4483, rewards: 0.2344\n",
      "Iteration: 32, Train loss: -1.5609, rewards: 0.3435\n",
      "Iteration: 33, Train loss: -1.3516, rewards: 0.2831\n",
      "Iteration: 34, Train loss: -1.2105, rewards: 0.2539\n",
      "Iteration: 35, Train loss: -1.3689, rewards: 0.2922\n",
      "Iteration: 36, Train loss: -1.3691, rewards: 0.2909\n",
      "Iteration: 37, Train loss: -1.4789, rewards: 0.3143\n",
      "Iteration: 38, Train loss: -1.5440, rewards: 0.3175\n",
      "Iteration: 39, Train loss: -1.3731, rewards: 0.3357\n",
      "Iteration: 40, Train loss: -1.4434, rewards: 0.3091\n",
      "Eval:\n",
      "Hits@1: 0.5361, Hits@3: 0.6907, Hits@10: 0.7938, MRR: 0.6242\n",
      "------------------------------------------------------------\n",
      "Iteration: 41, Train loss: -1.4245, rewards: 0.2377\n",
      "Iteration: 42, Train loss: -1.4982, rewards: 0.2643\n",
      "Iteration: 43, Train loss: -1.4482, rewards: 0.2851\n",
      "Iteration: 44, Train loss: -1.5945, rewards: 0.2727\n",
      "Iteration: 45, Train loss: -1.2665, rewards: 0.2695\n",
      "Iteration: 46, Train loss: -1.5328, rewards: 0.2831\n",
      "Iteration: 47, Train loss: -1.3013, rewards: 0.3227\n",
      "Iteration: 48, Train loss: -1.4739, rewards: 0.2591\n",
      "Iteration: 49, Train loss: -1.5695, rewards: 0.2779\n",
      "Iteration: 50, Train loss: -1.3567, rewards: 0.2740\n",
      "Eval:\n",
      "Hits@1: 0.5464, Hits@3: 0.6907, Hits@10: 0.7938, MRR: 0.6304\n",
      "------------------------------------------------------------\n",
      "Iteration: 51, Train loss: -1.3913, rewards: 0.3364\n",
      "Iteration: 52, Train loss: -1.4623, rewards: 0.2987\n",
      "Iteration: 53, Train loss: -1.3919, rewards: 0.2994\n",
      "Iteration: 54, Train loss: -1.4903, rewards: 0.2084\n",
      "Iteration: 55, Train loss: -1.4200, rewards: 0.2117\n",
      "Iteration: 56, Train loss: -1.5703, rewards: 0.2591\n",
      "Iteration: 57, Train loss: -1.4202, rewards: 0.3175\n",
      "Iteration: 58, Train loss: -1.3238, rewards: 0.3344\n",
      "Iteration: 59, Train loss: -1.3343, rewards: 0.3896\n",
      "Iteration: 60, Train loss: -1.3385, rewards: 0.3688\n",
      "Eval:\n",
      "Hits@1: 0.5876, Hits@3: 0.7629, Hits@10: 0.8351, MRR: 0.6726\n",
      "------------------------------------------------------------\n",
      "Iteration: 61, Train loss: -1.5136, rewards: 0.2403\n",
      "Iteration: 62, Train loss: -1.4319, rewards: 0.1442\n",
      "Iteration: 63, Train loss: -1.5164, rewards: 0.1935\n",
      "Iteration: 64, Train loss: -1.4444, rewards: 0.2792\n",
      "Iteration: 65, Train loss: -1.2506, rewards: 0.4208\n",
      "Iteration: 66, Train loss: -1.2879, rewards: 0.4857\n",
      "Iteration: 67, Train loss: -1.2205, rewards: 0.4753\n",
      "Iteration: 68, Train loss: -1.3149, rewards: 0.3714\n",
      "Iteration: 69, Train loss: -1.4207, rewards: 0.3013\n",
      "Iteration: 70, Train loss: -1.6874, rewards: 0.2727\n",
      "Eval:\n",
      "Hits@1: 0.6392, Hits@3: 0.7629, Hits@10: 0.8454, MRR: 0.7053\n",
      "------------------------------------------------------------\n",
      "Iteration: 71, Train loss: -1.5669, rewards: 0.2890\n",
      "Iteration: 72, Train loss: -1.5443, rewards: 0.3571\n",
      "Iteration: 73, Train loss: -1.4853, rewards: 0.3442\n",
      "Iteration: 74, Train loss: -1.3210, rewards: 0.3545\n",
      "Iteration: 75, Train loss: -1.4055, rewards: 0.3513\n",
      "Iteration: 76, Train loss: -1.5506, rewards: 0.3591\n",
      "Iteration: 77, Train loss: -1.3000, rewards: 0.2273\n",
      "Iteration: 78, Train loss: -1.3212, rewards: 0.1974\n",
      "Iteration: 79, Train loss: -1.4808, rewards: 0.3058\n",
      "Iteration: 80, Train loss: -1.5518, rewards: 0.2922\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7835, Hits@10: 0.8247, MRR: 0.7305\n",
      "------------------------------------------------------------\n",
      "Iteration: 81, Train loss: -1.4504, rewards: 0.3669\n",
      "Iteration: 82, Train loss: -1.2649, rewards: 0.3825\n",
      "Iteration: 83, Train loss: -1.3268, rewards: 0.3494\n",
      "Iteration: 84, Train loss: -1.4098, rewards: 0.3500\n",
      "Iteration: 85, Train loss: -1.4074, rewards: 0.2825\n",
      "Iteration: 86, Train loss: -1.3074, rewards: 0.2552\n",
      "Iteration: 87, Train loss: -1.5797, rewards: 0.3565\n",
      "Iteration: 88, Train loss: -1.3043, rewards: 0.3331\n",
      "Iteration: 89, Train loss: -1.2617, rewards: 0.3130\n",
      "Iteration: 90, Train loss: -1.3198, rewards: 0.3558\n",
      "Eval:\n",
      "Hits@1: 0.6082, Hits@3: 0.7423, Hits@10: 0.8247, MRR: 0.6795\n",
      "------------------------------------------------------------\n",
      "Iteration: 91, Train loss: -1.4763, rewards: 0.4058\n",
      "Iteration: 92, Train loss: -1.4590, rewards: 0.3727\n",
      "Iteration: 93, Train loss: -1.5198, rewards: 0.3584\n",
      "Iteration: 94, Train loss: -1.2354, rewards: 0.2532\n",
      "Iteration: 95, Train loss: -1.3581, rewards: 0.2578\n",
      "Iteration: 96, Train loss: -1.3621, rewards: 0.2591\n",
      "Iteration: 97, Train loss: -1.6198, rewards: 0.3435\n",
      "Iteration: 98, Train loss: -1.5217, rewards: 0.3227\n",
      "Iteration: 99, Train loss: -1.3671, rewards: 0.2494\n",
      "Iteration: 100, Train loss: -1.5077, rewards: 0.3078\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7380\n",
      "------------------------------------------------------------\n",
      "Iteration: 101, Train loss: -1.4888, rewards: 0.4065\n",
      "Iteration: 102, Train loss: -1.3260, rewards: 0.3221\n",
      "Iteration: 103, Train loss: -1.2872, rewards: 0.3494\n",
      "Iteration: 104, Train loss: -1.4667, rewards: 0.2987\n",
      "Iteration: 105, Train loss: -1.7644, rewards: 0.4214\n",
      "Iteration: 106, Train loss: -1.3643, rewards: 0.2955\n",
      "Iteration: 107, Train loss: -1.4341, rewards: 0.4312\n",
      "Iteration: 108, Train loss: -1.4156, rewards: 0.4156\n",
      "Iteration: 109, Train loss: -1.2770, rewards: 0.3688\n",
      "Iteration: 110, Train loss: -1.4891, rewards: 0.3955\n",
      "Eval:\n",
      "Hits@1: 0.6186, Hits@3: 0.7526, Hits@10: 0.8247, MRR: 0.6920\n",
      "------------------------------------------------------------\n",
      "Iteration: 111, Train loss: -1.4790, rewards: 0.3565\n",
      "Iteration: 112, Train loss: -1.3653, rewards: 0.3091\n",
      "Iteration: 113, Train loss: -1.4831, rewards: 0.3422\n",
      "Iteration: 114, Train loss: -1.2806, rewards: 0.3084\n",
      "Iteration: 115, Train loss: -1.5540, rewards: 0.3623\n",
      "Iteration: 116, Train loss: -1.4707, rewards: 0.3130\n",
      "Iteration: 117, Train loss: -1.4853, rewards: 0.3610\n",
      "Iteration: 118, Train loss: -1.2679, rewards: 0.3084\n",
      "Iteration: 119, Train loss: -1.5617, rewards: 0.3065\n",
      "Iteration: 120, Train loss: -1.3928, rewards: 0.3948\n",
      "Eval:\n",
      "Hits@1: 0.6598, Hits@3: 0.7835, Hits@10: 0.8454, MRR: 0.7240\n",
      "------------------------------------------------------------\n",
      "Iteration: 121, Train loss: -1.1736, rewards: 0.3539\n",
      "Iteration: 122, Train loss: -1.4610, rewards: 0.3851\n",
      "Iteration: 123, Train loss: -1.4713, rewards: 0.3571\n",
      "Iteration: 124, Train loss: -1.4245, rewards: 0.3110\n",
      "Iteration: 125, Train loss: -1.5264, rewards: 0.3221\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 126, Train loss: -1.4136, rewards: 0.3221\n",
      "Iteration: 127, Train loss: -1.2577, rewards: 0.3351\n",
      "Iteration: 128, Train loss: -1.4291, rewards: 0.3403\n",
      "Iteration: 129, Train loss: -1.5232, rewards: 0.3416\n",
      "Iteration: 130, Train loss: -1.3246, rewards: 0.3019\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7835, Hits@10: 0.8247, MRR: 0.7255\n",
      "------------------------------------------------------------\n",
      "Iteration: 131, Train loss: -1.5079, rewards: 0.3364\n",
      "Iteration: 132, Train loss: -1.4445, rewards: 0.3006\n",
      "Iteration: 133, Train loss: -1.3744, rewards: 0.3136\n",
      "Iteration: 134, Train loss: -1.3952, rewards: 0.3532\n",
      "Iteration: 135, Train loss: -1.1950, rewards: 0.3571\n",
      "Iteration: 136, Train loss: -1.4023, rewards: 0.3929\n",
      "Iteration: 137, Train loss: -1.4742, rewards: 0.2851\n",
      "Iteration: 138, Train loss: -1.5639, rewards: 0.2812\n",
      "Iteration: 139, Train loss: -1.4484, rewards: 0.2799\n",
      "Iteration: 140, Train loss: -1.4753, rewards: 0.2721\n",
      "Eval:\n",
      "Hits@1: 0.6598, Hits@3: 0.7835, Hits@10: 0.8454, MRR: 0.7254\n",
      "------------------------------------------------------------\n",
      "Iteration: 141, Train loss: -1.3495, rewards: 0.3981\n",
      "Iteration: 142, Train loss: -1.4938, rewards: 0.4461\n",
      "Iteration: 143, Train loss: -1.1893, rewards: 0.4714\n",
      "Iteration: 144, Train loss: -1.2715, rewards: 0.4039\n",
      "Iteration: 145, Train loss: -1.5246, rewards: 0.3383\n",
      "Iteration: 146, Train loss: -1.5696, rewards: 0.2740\n",
      "Iteration: 147, Train loss: -1.3940, rewards: 0.2370\n",
      "Iteration: 148, Train loss: -1.5412, rewards: 0.3110\n",
      "Iteration: 149, Train loss: -1.5301, rewards: 0.4097\n",
      "Iteration: 150, Train loss: -1.0147, rewards: 0.3825\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7938, Hits@10: 0.8454, MRR: 0.7403\n",
      "------------------------------------------------------------\n",
      "Iteration: 151, Train loss: -1.3198, rewards: 0.4331\n",
      "Iteration: 152, Train loss: -1.2644, rewards: 0.4208\n",
      "Iteration: 153, Train loss: -1.3358, rewards: 0.3474\n",
      "Iteration: 154, Train loss: -1.5267, rewards: 0.3221\n",
      "Iteration: 155, Train loss: -1.6699, rewards: 0.3097\n",
      "Iteration: 156, Train loss: -1.4730, rewards: 0.2909\n",
      "Iteration: 157, Train loss: -1.4237, rewards: 0.3688\n",
      "Iteration: 158, Train loss: -1.2949, rewards: 0.4643\n",
      "Iteration: 159, Train loss: -1.2906, rewards: 0.4532\n",
      "Iteration: 160, Train loss: -1.3224, rewards: 0.4156\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7835, Hits@10: 0.8351, MRR: 0.7241\n",
      "------------------------------------------------------------\n",
      "Iteration: 161, Train loss: -1.3667, rewards: 0.3331\n",
      "Iteration: 162, Train loss: -1.3759, rewards: 0.2526\n",
      "Iteration: 163, Train loss: -1.4202, rewards: 0.2292\n",
      "Iteration: 164, Train loss: -1.6262, rewards: 0.3026\n",
      "Iteration: 165, Train loss: -1.4238, rewards: 0.3201\n",
      "Iteration: 166, Train loss: -1.6307, rewards: 0.4175\n",
      "Iteration: 167, Train loss: -1.5442, rewards: 0.4526\n",
      "Iteration: 168, Train loss: -1.5005, rewards: 0.4325\n",
      "Iteration: 169, Train loss: -1.3650, rewards: 0.3429\n",
      "Iteration: 170, Train loss: -1.4008, rewards: 0.2494\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7225\n",
      "------------------------------------------------------------\n",
      "Iteration: 171, Train loss: -1.4596, rewards: 0.2682\n",
      "Iteration: 172, Train loss: -1.5817, rewards: 0.2740\n",
      "Iteration: 173, Train loss: -1.4670, rewards: 0.3753\n",
      "Iteration: 174, Train loss: -1.5006, rewards: 0.3597\n",
      "Iteration: 175, Train loss: -1.2862, rewards: 0.3325\n",
      "Iteration: 176, Train loss: -1.3448, rewards: 0.4578\n",
      "Iteration: 177, Train loss: -1.5350, rewards: 0.4266\n",
      "Iteration: 178, Train loss: -1.3733, rewards: 0.3675\n",
      "Iteration: 179, Train loss: -1.5050, rewards: 0.2864\n",
      "Iteration: 180, Train loss: -1.5648, rewards: 0.2649\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7248\n",
      "------------------------------------------------------------\n",
      "Iteration: 181, Train loss: -1.5474, rewards: 0.2851\n",
      "Iteration: 182, Train loss: -1.4938, rewards: 0.3279\n",
      "Iteration: 183, Train loss: -1.3638, rewards: 0.3247\n",
      "Iteration: 184, Train loss: -1.4120, rewards: 0.4429\n",
      "Iteration: 185, Train loss: -1.3018, rewards: 0.3416\n",
      "Iteration: 186, Train loss: -1.3619, rewards: 0.4188\n",
      "Iteration: 187, Train loss: -1.4878, rewards: 0.4175\n",
      "Iteration: 188, Train loss: -1.2912, rewards: 0.3227\n",
      "Iteration: 189, Train loss: -1.5906, rewards: 0.2844\n",
      "Iteration: 190, Train loss: -1.5685, rewards: 0.2890\n",
      "Eval:\n",
      "Hits@1: 0.6598, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7113\n",
      "------------------------------------------------------------\n",
      "Iteration: 191, Train loss: -1.3799, rewards: 0.2377\n",
      "Iteration: 192, Train loss: -1.4258, rewards: 0.3045\n",
      "Iteration: 193, Train loss: -1.3292, rewards: 0.3019\n",
      "Iteration: 194, Train loss: -1.2830, rewards: 0.3474\n",
      "Iteration: 195, Train loss: -1.2904, rewards: 0.3864\n",
      "Iteration: 196, Train loss: -1.4927, rewards: 0.4214\n",
      "Iteration: 197, Train loss: -1.2699, rewards: 0.3623\n",
      "Iteration: 198, Train loss: -1.4478, rewards: 0.3519\n",
      "Iteration: 199, Train loss: -1.2290, rewards: 0.3091\n",
      "Iteration: 200, Train loss: -1.4230, rewards: 0.3299\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7223\n",
      "------------------------------------------------------------\n",
      "Iteration: 201, Train loss: -1.6171, rewards: 0.3175\n",
      "Iteration: 202, Train loss: -1.4375, rewards: 0.2279\n",
      "Iteration: 203, Train loss: -1.5428, rewards: 0.2442\n",
      "Iteration: 204, Train loss: -1.4865, rewards: 0.2857\n",
      "Iteration: 205, Train loss: -1.3434, rewards: 0.2857\n",
      "Iteration: 206, Train loss: -1.4273, rewards: 0.3753\n",
      "Iteration: 207, Train loss: -1.4442, rewards: 0.5091\n",
      "Iteration: 208, Train loss: -1.4510, rewards: 0.4104\n",
      "Iteration: 209, Train loss: -1.3212, rewards: 0.3474\n",
      "Iteration: 210, Train loss: -1.4205, rewards: 0.2506\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7229\n",
      "------------------------------------------------------------\n",
      "Iteration: 211, Train loss: -1.4418, rewards: 0.2727\n",
      "Iteration: 212, Train loss: -1.3965, rewards: 0.2610\n",
      "Iteration: 213, Train loss: -1.4974, rewards: 0.3630\n",
      "Iteration: 214, Train loss: -1.3505, rewards: 0.3292\n",
      "Iteration: 215, Train loss: -1.5483, rewards: 0.3636\n",
      "Iteration: 216, Train loss: -1.3982, rewards: 0.4481\n",
      "Iteration: 217, Train loss: -1.5123, rewards: 0.4409\n",
      "Iteration: 218, Train loss: -1.5786, rewards: 0.4097\n",
      "Iteration: 219, Train loss: -1.3899, rewards: 0.3169\n",
      "Iteration: 220, Train loss: -1.5759, rewards: 0.3156\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7206\n",
      "------------------------------------------------------------\n",
      "Iteration: 221, Train loss: -1.4196, rewards: 0.2961\n",
      "Iteration: 222, Train loss: -1.4872, rewards: 0.2903\n",
      "Iteration: 223, Train loss: -1.5161, rewards: 0.4104\n",
      "Iteration: 224, Train loss: -1.3912, rewards: 0.4143\n",
      "Iteration: 225, Train loss: -1.4420, rewards: 0.4221\n",
      "Iteration: 226, Train loss: -1.2908, rewards: 0.4117\n",
      "Iteration: 227, Train loss: -1.4459, rewards: 0.3045\n",
      "Iteration: 228, Train loss: -1.5830, rewards: 0.3513\n",
      "Iteration: 229, Train loss: -1.5767, rewards: 0.3110\n",
      "Iteration: 230, Train loss: -1.4870, rewards: 0.3442\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7938, Hits@10: 0.8144, MRR: 0.7456\n",
      "------------------------------------------------------------\n",
      "Iteration: 231, Train loss: -1.5007, rewards: 0.3578\n",
      "Iteration: 232, Train loss: -1.3672, rewards: 0.3506\n",
      "Iteration: 233, Train loss: -1.3382, rewards: 0.4162\n",
      "Iteration: 234, Train loss: -1.3693, rewards: 0.5052\n",
      "Iteration: 235, Train loss: -1.4184, rewards: 0.3597\n",
      "Iteration: 236, Train loss: -1.3049, rewards: 0.3175\n",
      "Iteration: 237, Train loss: -1.4001, rewards: 0.3162\n",
      "Iteration: 238, Train loss: -1.3605, rewards: 0.3396\n",
      "Iteration: 239, Train loss: -1.4549, rewards: 0.3312\n",
      "Iteration: 240, Train loss: -1.5807, rewards: 0.3247\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7302\n",
      "------------------------------------------------------------\n",
      "Iteration: 241, Train loss: -1.2564, rewards: 0.3045\n",
      "Iteration: 242, Train loss: -1.5400, rewards: 0.3422\n",
      "Iteration: 243, Train loss: -1.3764, rewards: 0.3506\n",
      "Iteration: 244, Train loss: -1.4231, rewards: 0.3721\n",
      "Iteration: 245, Train loss: -1.4959, rewards: 0.3617\n",
      "Iteration: 246, Train loss: -1.2637, rewards: 0.3494\n",
      "Iteration: 247, Train loss: -1.5838, rewards: 0.3870\n",
      "Iteration: 248, Train loss: -1.5608, rewards: 0.3474\n",
      "Iteration: 249, Train loss: -1.6196, rewards: 0.4208\n",
      "Iteration: 250, Train loss: -1.6495, rewards: 0.4201\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7374\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 251, Train loss: -1.4363, rewards: 0.4045\n",
      "Iteration: 252, Train loss: -1.5191, rewards: 0.3935\n",
      "Iteration: 253, Train loss: -1.5003, rewards: 0.3643\n",
      "Iteration: 254, Train loss: -1.2315, rewards: 0.4318\n",
      "Iteration: 255, Train loss: -1.3969, rewards: 0.3312\n",
      "Iteration: 256, Train loss: -1.4534, rewards: 0.3435\n",
      "Iteration: 257, Train loss: -1.3342, rewards: 0.2779\n",
      "Iteration: 258, Train loss: -1.5685, rewards: 0.3377\n",
      "Iteration: 259, Train loss: -1.4720, rewards: 0.3052\n",
      "Iteration: 260, Train loss: -1.6298, rewards: 0.4377\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7263\n",
      "------------------------------------------------------------\n",
      "Iteration: 261, Train loss: -1.3468, rewards: 0.3708\n",
      "Iteration: 262, Train loss: -1.1375, rewards: 0.3461\n",
      "Iteration: 263, Train loss: -1.3415, rewards: 0.3922\n",
      "Iteration: 264, Train loss: -1.4316, rewards: 0.3195\n",
      "Iteration: 265, Train loss: -1.3221, rewards: 0.2669\n",
      "Iteration: 266, Train loss: -1.3953, rewards: 0.3286\n",
      "Iteration: 267, Train loss: -1.1967, rewards: 0.2812\n",
      "Iteration: 268, Train loss: -1.2739, rewards: 0.3903\n",
      "Iteration: 269, Train loss: -1.3685, rewards: 0.3916\n",
      "Iteration: 270, Train loss: -1.4563, rewards: 0.4481\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7273\n",
      "------------------------------------------------------------\n",
      "Iteration: 271, Train loss: -1.3894, rewards: 0.4156\n",
      "Iteration: 272, Train loss: -1.5162, rewards: 0.3416\n",
      "Iteration: 273, Train loss: -1.5827, rewards: 0.3909\n",
      "Iteration: 274, Train loss: -1.3235, rewards: 0.3169\n",
      "Iteration: 275, Train loss: -1.3776, rewards: 0.2948\n",
      "Iteration: 276, Train loss: -1.3551, rewards: 0.3558\n",
      "Iteration: 277, Train loss: -1.4717, rewards: 0.3383\n",
      "Iteration: 278, Train loss: -1.3769, rewards: 0.4591\n",
      "Iteration: 279, Train loss: -1.2164, rewards: 0.4032\n",
      "Iteration: 280, Train loss: -1.4901, rewards: 0.4409\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7250\n",
      "------------------------------------------------------------\n",
      "Iteration: 281, Train loss: -1.6978, rewards: 0.4377\n",
      "Iteration: 282, Train loss: -1.5123, rewards: 0.3286\n",
      "Iteration: 283, Train loss: -1.4350, rewards: 0.3695\n",
      "Iteration: 284, Train loss: -1.5725, rewards: 0.3123\n",
      "Iteration: 285, Train loss: -1.3586, rewards: 0.3597\n",
      "Iteration: 286, Train loss: -1.3931, rewards: 0.3390\n",
      "Iteration: 287, Train loss: -1.3597, rewards: 0.3247\n",
      "Iteration: 288, Train loss: -1.4269, rewards: 0.4136\n",
      "Iteration: 289, Train loss: -1.4926, rewards: 0.4519\n",
      "Iteration: 290, Train loss: -1.2727, rewards: 0.3857\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7427\n",
      "------------------------------------------------------------\n",
      "Iteration: 291, Train loss: -1.4581, rewards: 0.3721\n",
      "Iteration: 292, Train loss: -1.5078, rewards: 0.3799\n",
      "Iteration: 293, Train loss: -1.4151, rewards: 0.3338\n",
      "Iteration: 294, Train loss: -1.4409, rewards: 0.3052\n",
      "Iteration: 295, Train loss: -1.6634, rewards: 0.2955\n",
      "Iteration: 296, Train loss: -1.6103, rewards: 0.4078\n",
      "Iteration: 297, Train loss: -1.4486, rewards: 0.3688\n",
      "Iteration: 298, Train loss: -1.6041, rewards: 0.3825\n",
      "Iteration: 299, Train loss: -1.4646, rewards: 0.3701\n",
      "Iteration: 300, Train loss: -1.4463, rewards: 0.4253\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7440\n",
      "------------------------------------------------------------\n",
      "Iteration: 301, Train loss: -1.3359, rewards: 0.3909\n",
      "Iteration: 302, Train loss: -1.4632, rewards: 0.3409\n",
      "Iteration: 303, Train loss: -1.4882, rewards: 0.3318\n",
      "Iteration: 304, Train loss: -1.6526, rewards: 0.3916\n",
      "Iteration: 305, Train loss: -1.5317, rewards: 0.3974\n",
      "Iteration: 306, Train loss: -1.5777, rewards: 0.3721\n",
      "Iteration: 307, Train loss: -1.3268, rewards: 0.2682\n",
      "Iteration: 308, Train loss: -1.6060, rewards: 0.3591\n",
      "Iteration: 309, Train loss: -1.6142, rewards: 0.3377\n",
      "Iteration: 310, Train loss: -1.2350, rewards: 0.3571\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7463\n",
      "------------------------------------------------------------\n",
      "Iteration: 311, Train loss: -1.2887, rewards: 0.3786\n",
      "Iteration: 312, Train loss: -1.2235, rewards: 0.4019\n",
      "Iteration: 313, Train loss: -1.2733, rewards: 0.3916\n",
      "Iteration: 314, Train loss: -1.3962, rewards: 0.3799\n",
      "Iteration: 315, Train loss: -1.4111, rewards: 0.3331\n",
      "Iteration: 316, Train loss: -1.4124, rewards: 0.3513\n",
      "Iteration: 317, Train loss: -1.5872, rewards: 0.3727\n",
      "Iteration: 318, Train loss: -1.2025, rewards: 0.3987\n",
      "Iteration: 319, Train loss: -1.2878, rewards: 0.3851\n",
      "Iteration: 320, Train loss: -1.3681, rewards: 0.3526\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7453\n",
      "------------------------------------------------------------\n",
      "Iteration: 321, Train loss: -1.4361, rewards: 0.3474\n",
      "Iteration: 322, Train loss: -1.3979, rewards: 0.3500\n",
      "Iteration: 323, Train loss: -1.4489, rewards: 0.4169\n",
      "Iteration: 324, Train loss: -1.2829, rewards: 0.3643\n",
      "Iteration: 325, Train loss: -1.3692, rewards: 0.3630\n",
      "Iteration: 326, Train loss: -1.3432, rewards: 0.3760\n",
      "Iteration: 327, Train loss: -1.5038, rewards: 0.2649\n",
      "Iteration: 328, Train loss: -1.4293, rewards: 0.2864\n",
      "Iteration: 329, Train loss: -1.5440, rewards: 0.3169\n",
      "Iteration: 330, Train loss: -1.3282, rewards: 0.2844\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7413\n",
      "------------------------------------------------------------\n",
      "Iteration: 331, Train loss: -1.4189, rewards: 0.3175\n",
      "Iteration: 332, Train loss: -1.3574, rewards: 0.3292\n",
      "Iteration: 333, Train loss: -1.5474, rewards: 0.5130\n",
      "Iteration: 334, Train loss: -1.4112, rewards: 0.4084\n",
      "Iteration: 335, Train loss: -1.2555, rewards: 0.3831\n",
      "Iteration: 336, Train loss: -1.5667, rewards: 0.3844\n",
      "Iteration: 337, Train loss: -1.5129, rewards: 0.3604\n",
      "Iteration: 338, Train loss: -1.4043, rewards: 0.3208\n",
      "Iteration: 339, Train loss: -1.4627, rewards: 0.3247\n",
      "Iteration: 340, Train loss: -1.5822, rewards: 0.3688\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7465\n",
      "------------------------------------------------------------\n",
      "Iteration: 341, Train loss: -1.4151, rewards: 0.3260\n",
      "Iteration: 342, Train loss: -1.4012, rewards: 0.3851\n",
      "Iteration: 343, Train loss: -1.4380, rewards: 0.4188\n",
      "Iteration: 344, Train loss: -1.5374, rewards: 0.4416\n",
      "Iteration: 345, Train loss: -1.3835, rewards: 0.4565\n",
      "Iteration: 346, Train loss: -1.3670, rewards: 0.2929\n",
      "Iteration: 347, Train loss: -1.5077, rewards: 0.3299\n",
      "Iteration: 348, Train loss: -1.3973, rewards: 0.2747\n",
      "Iteration: 349, Train loss: -1.3333, rewards: 0.3403\n",
      "Iteration: 350, Train loss: -1.4386, rewards: 0.4013\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7408\n",
      "------------------------------------------------------------\n",
      "Iteration: 351, Train loss: -1.3794, rewards: 0.4331\n",
      "Iteration: 352, Train loss: -1.5203, rewards: 0.4208\n",
      "Iteration: 353, Train loss: -1.3793, rewards: 0.3351\n",
      "Iteration: 354, Train loss: -1.4389, rewards: 0.3779\n",
      "Iteration: 355, Train loss: -1.4387, rewards: 0.3812\n",
      "Iteration: 356, Train loss: -1.4463, rewards: 0.3688\n",
      "Iteration: 357, Train loss: -1.4971, rewards: 0.3299\n",
      "Iteration: 358, Train loss: -1.5358, rewards: 0.3870\n",
      "Iteration: 359, Train loss: -1.6047, rewards: 0.4143\n",
      "Iteration: 360, Train loss: -1.4042, rewards: 0.3675\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7342\n",
      "------------------------------------------------------------\n",
      "Iteration: 361, Train loss: -1.5028, rewards: 0.3734\n",
      "Iteration: 362, Train loss: -1.3874, rewards: 0.3961\n",
      "Iteration: 363, Train loss: -1.3531, rewards: 0.3506\n",
      "Iteration: 364, Train loss: -1.4484, rewards: 0.3623\n",
      "Iteration: 365, Train loss: -1.3765, rewards: 0.3812\n",
      "Iteration: 366, Train loss: -1.4726, rewards: 0.3435\n",
      "Iteration: 367, Train loss: -1.1867, rewards: 0.2662\n",
      "Iteration: 368, Train loss: -1.4419, rewards: 0.3169\n",
      "Iteration: 369, Train loss: -1.4184, rewards: 0.3740\n",
      "Iteration: 370, Train loss: -1.3861, rewards: 0.3526\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7436\n",
      "------------------------------------------------------------\n",
      "Iteration: 371, Train loss: -1.2226, rewards: 0.3922\n",
      "Iteration: 372, Train loss: -1.5281, rewards: 0.4727\n",
      "Iteration: 373, Train loss: -1.4139, rewards: 0.3974\n",
      "Iteration: 374, Train loss: -1.4225, rewards: 0.2896\n",
      "Iteration: 375, Train loss: -1.3715, rewards: 0.3227\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 376, Train loss: -1.7902, rewards: 0.3877\n",
      "Iteration: 377, Train loss: -1.3877, rewards: 0.2799\n",
      "Iteration: 378, Train loss: -1.4274, rewards: 0.3084\n",
      "Iteration: 379, Train loss: -1.4005, rewards: 0.3981\n",
      "Iteration: 380, Train loss: -1.2564, rewards: 0.3721\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7394\n",
      "------------------------------------------------------------\n",
      "Iteration: 381, Train loss: -1.2123, rewards: 0.4370\n",
      "Iteration: 382, Train loss: -1.3716, rewards: 0.3929\n",
      "Iteration: 383, Train loss: -1.5292, rewards: 0.3994\n",
      "Iteration: 384, Train loss: -1.4539, rewards: 0.3474\n",
      "Iteration: 385, Train loss: -1.6045, rewards: 0.3065\n",
      "Iteration: 386, Train loss: -1.6026, rewards: 0.2961\n",
      "Iteration: 387, Train loss: -1.3134, rewards: 0.3695\n",
      "Iteration: 388, Train loss: -1.5138, rewards: 0.3273\n",
      "Iteration: 389, Train loss: -1.4482, rewards: 0.3766\n",
      "Iteration: 390, Train loss: -1.6383, rewards: 0.4844\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7394\n",
      "------------------------------------------------------------\n",
      "Iteration: 391, Train loss: -1.4716, rewards: 0.4143\n",
      "Iteration: 392, Train loss: -1.3747, rewards: 0.3442\n",
      "Iteration: 393, Train loss: -1.6308, rewards: 0.3727\n",
      "Iteration: 394, Train loss: -1.5037, rewards: 0.3078\n",
      "Iteration: 395, Train loss: -1.4157, rewards: 0.3143\n",
      "Iteration: 396, Train loss: -1.5489, rewards: 0.3474\n",
      "Iteration: 397, Train loss: -1.1987, rewards: 0.3630\n",
      "Iteration: 398, Train loss: -1.4244, rewards: 0.4156\n",
      "Iteration: 399, Train loss: -1.3822, rewards: 0.4481\n",
      "Iteration: 400, Train loss: -1.6018, rewards: 0.3636\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7379\n",
      "------------------------------------------------------------\n",
      "Iteration: 401, Train loss: -1.5312, rewards: 0.3474\n",
      "Iteration: 402, Train loss: -1.3920, rewards: 0.3532\n",
      "Iteration: 403, Train loss: -1.4731, rewards: 0.3545\n",
      "Iteration: 404, Train loss: -1.4205, rewards: 0.2792\n",
      "Iteration: 405, Train loss: -1.4930, rewards: 0.3084\n",
      "Iteration: 406, Train loss: -1.5312, rewards: 0.3539\n",
      "Iteration: 407, Train loss: -1.5845, rewards: 0.3929\n",
      "Iteration: 408, Train loss: -1.3310, rewards: 0.4279\n",
      "Iteration: 409, Train loss: -1.2960, rewards: 0.3474\n",
      "Iteration: 410, Train loss: -1.2685, rewards: 0.4649\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7629, Hits@10: 0.8144, MRR: 0.7368\n",
      "------------------------------------------------------------\n",
      "Iteration: 411, Train loss: -1.5825, rewards: 0.3591\n",
      "Iteration: 412, Train loss: -1.4724, rewards: 0.4110\n",
      "Iteration: 413, Train loss: -1.4375, rewards: 0.2734\n",
      "Iteration: 414, Train loss: -1.3592, rewards: 0.3338\n",
      "Iteration: 415, Train loss: -1.3615, rewards: 0.4513\n",
      "Iteration: 416, Train loss: -1.4273, rewards: 0.4364\n",
      "Iteration: 417, Train loss: -1.3191, rewards: 0.4266\n",
      "Iteration: 418, Train loss: -1.4679, rewards: 0.4253\n",
      "Iteration: 419, Train loss: -1.6422, rewards: 0.4292\n",
      "Iteration: 420, Train loss: -1.6345, rewards: 0.3968\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7461\n",
      "------------------------------------------------------------\n",
      "Iteration: 421, Train loss: -1.4763, rewards: 0.3188\n",
      "Iteration: 422, Train loss: -1.3381, rewards: 0.3214\n",
      "Iteration: 423, Train loss: -1.4734, rewards: 0.4175\n",
      "Iteration: 424, Train loss: -1.4428, rewards: 0.3955\n",
      "Iteration: 425, Train loss: -1.3276, rewards: 0.3545\n",
      "Iteration: 426, Train loss: -1.4966, rewards: 0.3662\n",
      "Iteration: 427, Train loss: -1.2707, rewards: 0.3701\n",
      "Iteration: 428, Train loss: -1.4869, rewards: 0.3604\n",
      "Iteration: 429, Train loss: -1.3432, rewards: 0.3071\n",
      "Iteration: 430, Train loss: -1.3792, rewards: 0.3325\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7323\n",
      "------------------------------------------------------------\n",
      "Iteration: 431, Train loss: -1.4480, rewards: 0.3383\n",
      "Iteration: 432, Train loss: -1.4237, rewards: 0.4019\n",
      "Iteration: 433, Train loss: -1.5963, rewards: 0.3818\n",
      "Iteration: 434, Train loss: -1.4343, rewards: 0.4708\n",
      "Iteration: 435, Train loss: -1.2620, rewards: 0.4753\n",
      "Iteration: 436, Train loss: -1.4045, rewards: 0.4636\n",
      "Iteration: 437, Train loss: -1.4838, rewards: 0.3195\n",
      "Iteration: 438, Train loss: -1.4203, rewards: 0.3071\n",
      "Iteration: 439, Train loss: -1.6076, rewards: 0.4182\n",
      "Iteration: 440, Train loss: -1.2026, rewards: 0.2838\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7394\n",
      "------------------------------------------------------------\n",
      "Iteration: 441, Train loss: -1.4102, rewards: 0.3818\n",
      "Iteration: 442, Train loss: -1.4827, rewards: 0.4006\n",
      "Iteration: 443, Train loss: -1.2887, rewards: 0.4636\n",
      "Iteration: 444, Train loss: -1.2751, rewards: 0.3929\n",
      "Iteration: 445, Train loss: -1.4420, rewards: 0.3643\n",
      "Iteration: 446, Train loss: -1.3108, rewards: 0.2558\n",
      "Iteration: 447, Train loss: -1.5037, rewards: 0.2786\n",
      "Iteration: 448, Train loss: -1.2458, rewards: 0.2474\n",
      "Iteration: 449, Train loss: -1.6599, rewards: 0.3299\n",
      "Iteration: 450, Train loss: -1.4798, rewards: 0.3383\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7461\n",
      "------------------------------------------------------------\n",
      "Iteration: 451, Train loss: -1.5574, rewards: 0.4227\n",
      "Iteration: 452, Train loss: -1.4613, rewards: 0.4292\n",
      "Iteration: 453, Train loss: -1.2374, rewards: 0.4597\n",
      "Iteration: 454, Train loss: -1.4059, rewards: 0.3188\n",
      "Iteration: 455, Train loss: -1.2923, rewards: 0.2903\n",
      "Iteration: 456, Train loss: -1.4507, rewards: 0.3442\n",
      "Iteration: 457, Train loss: -1.4785, rewards: 0.3344\n",
      "Iteration: 458, Train loss: -1.2838, rewards: 0.2844\n",
      "Iteration: 459, Train loss: -1.4070, rewards: 0.3916\n",
      "Iteration: 460, Train loss: -1.3769, rewards: 0.3747\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7499\n",
      "------------------------------------------------------------\n",
      "Iteration: 461, Train loss: -1.4917, rewards: 0.4526\n",
      "Iteration: 462, Train loss: -1.2535, rewards: 0.4643\n",
      "Iteration: 463, Train loss: -1.4441, rewards: 0.4591\n",
      "Iteration: 464, Train loss: -1.5373, rewards: 0.3812\n",
      "Iteration: 465, Train loss: -1.5689, rewards: 0.3558\n",
      "Iteration: 466, Train loss: -1.3889, rewards: 0.2747\n",
      "Iteration: 467, Train loss: -1.3680, rewards: 0.3805\n",
      "Iteration: 468, Train loss: -1.2994, rewards: 0.4305\n",
      "Iteration: 469, Train loss: -1.3610, rewards: 0.3701\n",
      "Iteration: 470, Train loss: -1.2219, rewards: 0.3623\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7732, Hits@10: 0.8144, MRR: 0.7340\n",
      "------------------------------------------------------------\n",
      "Iteration: 471, Train loss: -1.3238, rewards: 0.3792\n",
      "Iteration: 472, Train loss: -1.2572, rewards: 0.3968\n",
      "Iteration: 473, Train loss: -1.4493, rewards: 0.4143\n",
      "Iteration: 474, Train loss: -1.4406, rewards: 0.3942\n",
      "Iteration: 475, Train loss: -1.4407, rewards: 0.3675\n",
      "Iteration: 476, Train loss: -1.4571, rewards: 0.3461\n",
      "Iteration: 477, Train loss: -1.3050, rewards: 0.3234\n",
      "Iteration: 478, Train loss: -1.5756, rewards: 0.4032\n",
      "Iteration: 479, Train loss: -1.3745, rewards: 0.4364\n",
      "Iteration: 480, Train loss: -1.4393, rewards: 0.4357\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7835, Hits@10: 0.8247, MRR: 0.7470\n",
      "------------------------------------------------------------\n",
      "Iteration: 481, Train loss: -1.3912, rewards: 0.4013\n",
      "Iteration: 482, Train loss: -1.3530, rewards: 0.3786\n",
      "Iteration: 483, Train loss: -1.4234, rewards: 0.3766\n",
      "Iteration: 484, Train loss: -1.2683, rewards: 0.4065\n",
      "Iteration: 485, Train loss: -1.3916, rewards: 0.3630\n",
      "Iteration: 486, Train loss: -1.2440, rewards: 0.2974\n",
      "Iteration: 487, Train loss: -1.4977, rewards: 0.3175\n",
      "Iteration: 488, Train loss: -1.4177, rewards: 0.3260\n",
      "Iteration: 489, Train loss: -1.3252, rewards: 0.3987\n",
      "Iteration: 490, Train loss: -1.2319, rewards: 0.3987\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7427\n",
      "------------------------------------------------------------\n",
      "Iteration: 491, Train loss: -1.4545, rewards: 0.4630\n",
      "Iteration: 492, Train loss: -1.4602, rewards: 0.4597\n",
      "Iteration: 493, Train loss: -1.6095, rewards: 0.4390\n",
      "Iteration: 494, Train loss: -1.3017, rewards: 0.2955\n",
      "Iteration: 495, Train loss: -1.5301, rewards: 0.3981\n",
      "Iteration: 496, Train loss: -1.5545, rewards: 0.4169\n",
      "Iteration: 497, Train loss: -1.5573, rewards: 0.3916\n",
      "Iteration: 498, Train loss: -1.4994, rewards: 0.4058\n",
      "Iteration: 499, Train loss: -1.5086, rewards: 0.4435\n",
      "Iteration: 500, Train loss: -1.4078, rewards: 0.3312\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7420\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------------------------------------------------------\n",
      "Iteration: 501, Train loss: -1.3808, rewards: 0.3338\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.5179, Hits@3: 0.7768, Hits@10: 0.8750, MRR: 0.6598\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.7897534013605442 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 22:31:16,865]\u001b[0m Trial 3 finished with value: 0.7897534013605442 and parameters: {'lr': 0.005524424877621921, 'bs': 77, 'b': 0.45623454548569337, 'l': 0.48059195845638003, 'ee': 10}. Best is trial 3 with value: 0.7897534013605442.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 10, Train loss: -0.7530, rewards: 0.1979\n",
      "Iteration: 20, Train loss: -1.0062, rewards: 0.3437\n",
      "Iteration: 30, Train loss: -1.1787, rewards: 0.3544\n",
      "Iteration: 40, Train loss: -1.0328, rewards: 0.4480\n",
      "Iteration: 50, Train loss: -1.0642, rewards: 0.4697\n",
      "Iteration: 60, Train loss: -0.9292, rewards: 0.4905\n",
      "Iteration: 70, Train loss: -0.8947, rewards: 0.5174\n",
      "Iteration: 80, Train loss: -0.9036, rewards: 0.5356\n",
      "Iteration: 90, Train loss: -0.9113, rewards: 0.5142\n",
      "Iteration: 100, Train loss: -0.9165, rewards: 0.5840\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.8041, Hits@10: 0.8247, MRR: 0.7852\n",
      "------------------------------------------------------------\n",
      "Iteration: 110, Train loss: -0.7985, rewards: 0.5518\n",
      "Iteration: 120, Train loss: -0.8610, rewards: 0.5487\n",
      "Iteration: 130, Train loss: -0.8415, rewards: 0.5556\n",
      "Iteration: 140, Train loss: -0.7630, rewards: 0.5856\n",
      "Iteration: 150, Train loss: -0.7117, rewards: 0.5995\n",
      "Iteration: 160, Train loss: -0.8434, rewards: 0.5712\n",
      "Iteration: 170, Train loss: -0.7885, rewards: 0.5810\n",
      "Iteration: 180, Train loss: -0.8445, rewards: 0.5612\n",
      "Iteration: 190, Train loss: -0.7259, rewards: 0.6199\n",
      "Iteration: 200, Train loss: -0.8640, rewards: 0.5836\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.8041, Hits@10: 0.8144, MRR: 0.7844\n",
      "------------------------------------------------------------\n",
      "Iteration: 210, Train loss: -0.8170, rewards: 0.6091\n",
      "Iteration: 220, Train loss: -0.7925, rewards: 0.5816\n",
      "Iteration: 230, Train loss: -0.7137, rewards: 0.6145\n",
      "Iteration: 240, Train loss: -0.7657, rewards: 0.6021\n",
      "Iteration: 250, Train loss: -0.7498, rewards: 0.6142\n",
      "Iteration: 260, Train loss: -0.7433, rewards: 0.6147\n",
      "Iteration: 270, Train loss: -0.8823, rewards: 0.5522\n",
      "Iteration: 280, Train loss: -0.8100, rewards: 0.5962\n",
      "Iteration: 290, Train loss: -0.7643, rewards: 0.6405\n",
      "Iteration: 300, Train loss: -0.7792, rewards: 0.6009\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7730\n",
      "------------------------------------------------------------\n",
      "Iteration: 310, Train loss: -0.7353, rewards: 0.6458\n",
      "Iteration: 320, Train loss: -0.6862, rewards: 0.6456\n",
      "Iteration: 330, Train loss: -0.7731, rewards: 0.6363\n",
      "Iteration: 340, Train loss: -0.7569, rewards: 0.6252\n",
      "Iteration: 350, Train loss: -0.7282, rewards: 0.5995\n",
      "Iteration: 360, Train loss: -0.7172, rewards: 0.6380\n",
      "Iteration: 370, Train loss: -0.7814, rewards: 0.6066\n",
      "Iteration: 380, Train loss: -0.7220, rewards: 0.6276\n",
      "Iteration: 390, Train loss: -0.7618, rewards: 0.6182\n",
      "Iteration: 400, Train loss: -0.7539, rewards: 0.6442\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7938, Hits@10: 0.8144, MRR: 0.7702\n",
      "------------------------------------------------------------\n",
      "Iteration: 410, Train loss: -0.7341, rewards: 0.6195\n",
      "Iteration: 420, Train loss: -0.7242, rewards: 0.6326\n",
      "Iteration: 430, Train loss: -0.7872, rewards: 0.5904\n",
      "Iteration: 440, Train loss: -0.7013, rewards: 0.6486\n",
      "Iteration: 450, Train loss: -0.6798, rewards: 0.6466\n",
      "Iteration: 460, Train loss: -0.6769, rewards: 0.6894\n",
      "Iteration: 470, Train loss: -0.5915, rewards: 0.6860\n",
      "Iteration: 480, Train loss: -0.8057, rewards: 0.5999\n",
      "Iteration: 490, Train loss: -0.6964, rewards: 0.6418\n",
      "Iteration: 500, Train loss: -0.7100, rewards: 0.6360\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7822\n",
      "------------------------------------------------------------\n",
      "Iteration: 510, Train loss: -0.7502, rewards: 0.6315\n",
      "Iteration: 520, Train loss: -0.7463, rewards: 0.6020\n",
      "Iteration: 530, Train loss: -0.5812, rewards: 0.6715\n",
      "Iteration: 540, Train loss: -0.7077, rewards: 0.6538\n",
      "Iteration: 550, Train loss: -0.7499, rewards: 0.6454\n",
      "Iteration: 560, Train loss: -0.7120, rewards: 0.6630\n",
      "Iteration: 570, Train loss: -0.7820, rewards: 0.6333\n",
      "Iteration: 580, Train loss: -0.7255, rewards: 0.6608\n",
      "Iteration: 590, Train loss: -0.6796, rewards: 0.6660\n",
      "Iteration: 600, Train loss: -0.7545, rewards: 0.6320\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7689\n",
      "------------------------------------------------------------\n",
      "Iteration: 610, Train loss: -0.6132, rewards: 0.6924\n",
      "Iteration: 620, Train loss: -0.6533, rewards: 0.6389\n",
      "Iteration: 630, Train loss: -0.7172, rewards: 0.6450\n",
      "Iteration: 640, Train loss: -0.6935, rewards: 0.6589\n",
      "Iteration: 650, Train loss: -0.6603, rewards: 0.6885\n",
      "Iteration: 660, Train loss: -0.6479, rewards: 0.6852\n",
      "Iteration: 670, Train loss: -0.6715, rewards: 0.6700\n",
      "Iteration: 680, Train loss: -0.6364, rewards: 0.6831\n",
      "Iteration: 690, Train loss: -0.7049, rewards: 0.6275\n",
      "Iteration: 700, Train loss: -0.6573, rewards: 0.6579\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7842\n",
      "------------------------------------------------------------\n",
      "Iteration: 710, Train loss: -0.6866, rewards: 0.6536\n",
      "Iteration: 720, Train loss: -0.6033, rewards: 0.6763\n",
      "Iteration: 730, Train loss: -0.7135, rewards: 0.6220\n",
      "Iteration: 740, Train loss: -0.6615, rewards: 0.6760\n",
      "Iteration: 750, Train loss: -0.6124, rewards: 0.6925\n",
      "Iteration: 760, Train loss: -0.5772, rewards: 0.6795\n",
      "Iteration: 770, Train loss: -0.6362, rewards: 0.6404\n",
      "Iteration: 780, Train loss: -0.5582, rewards: 0.7063\n",
      "Iteration: 790, Train loss: -0.6477, rewards: 0.6544\n",
      "Iteration: 800, Train loss: -0.6837, rewards: 0.6732\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7663\n",
      "------------------------------------------------------------\n",
      "Iteration: 810, Train loss: -0.6419, rewards: 0.6814\n",
      "Iteration: 820, Train loss: -0.6489, rewards: 0.6784\n",
      "Iteration: 830, Train loss: -0.6397, rewards: 0.6904\n",
      "Iteration: 840, Train loss: -0.6853, rewards: 0.6721\n",
      "Iteration: 850, Train loss: -0.5505, rewards: 0.6719\n",
      "Iteration: 860, Train loss: -0.7195, rewards: 0.6034\n",
      "Iteration: 870, Train loss: -0.6275, rewards: 0.6513\n",
      "Iteration: 880, Train loss: -0.7292, rewards: 0.6702\n",
      "Iteration: 890, Train loss: -0.5945, rewards: 0.6590\n",
      "Iteration: 900, Train loss: -0.6428, rewards: 0.6804\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7735\n",
      "------------------------------------------------------------\n",
      "Iteration: 910, Train loss: -0.6614, rewards: 0.7056\n",
      "Iteration: 920, Train loss: -0.6187, rewards: 0.6820\n",
      "Iteration: 930, Train loss: -0.5722, rewards: 0.6899\n",
      "Iteration: 940, Train loss: -0.7454, rewards: 0.6573\n",
      "Iteration: 950, Train loss: -0.5553, rewards: 0.7149\n",
      "Iteration: 960, Train loss: -0.6625, rewards: 0.6618\n",
      "Iteration: 970, Train loss: -0.6188, rewards: 0.6854\n",
      "Iteration: 980, Train loss: -0.5747, rewards: 0.6850\n",
      "Iteration: 990, Train loss: -0.7107, rewards: 0.6267\n",
      "Iteration: 1000, Train loss: -0.6766, rewards: 0.6736\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7741\n",
      "------------------------------------------------------------\n",
      "Iteration: 1010, Train loss: -0.6692, rewards: 0.6721\n",
      "Iteration: 1020, Train loss: -0.6540, rewards: 0.6624\n",
      "Iteration: 1030, Train loss: -0.6082, rewards: 0.7051\n",
      "Iteration: 1040, Train loss: -0.5659, rewards: 0.6934\n",
      "Iteration: 1050, Train loss: -0.7024, rewards: 0.6674\n",
      "Iteration: 1060, Train loss: -0.5795, rewards: 0.6910\n",
      "Iteration: 1070, Train loss: -0.6418, rewards: 0.6730\n",
      "Iteration: 1080, Train loss: -0.7175, rewards: 0.6542\n",
      "Iteration: 1090, Train loss: -0.5805, rewards: 0.6855\n",
      "Iteration: 1100, Train loss: -0.6528, rewards: 0.6892\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7792\n",
      "------------------------------------------------------------\n",
      "Iteration: 1110, Train loss: -0.5984, rewards: 0.6938\n",
      "Iteration: 1120, Train loss: -0.5655, rewards: 0.6779\n",
      "Iteration: 1130, Train loss: -0.6694, rewards: 0.6779\n",
      "Iteration: 1140, Train loss: -0.6145, rewards: 0.7066\n",
      "Iteration: 1150, Train loss: -0.6524, rewards: 0.6860\n",
      "Iteration: 1160, Train loss: -0.7215, rewards: 0.6937\n",
      "Iteration: 1170, Train loss: -0.5827, rewards: 0.6726\n",
      "Iteration: 1180, Train loss: -0.6427, rewards: 0.6887\n",
      "Iteration: 1190, Train loss: -0.6471, rewards: 0.6382\n",
      "Iteration: 1200, Train loss: -0.6646, rewards: 0.6733\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7672\n",
      "------------------------------------------------------------\n",
      "Iteration: 1210, Train loss: -0.6088, rewards: 0.6950\n",
      "Iteration: 1220, Train loss: -0.6248, rewards: 0.7089\n",
      "Iteration: 1230, Train loss: -0.6399, rewards: 0.6867\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1240, Train loss: -0.6161, rewards: 0.6989\n",
      "Iteration: 1250, Train loss: -0.6532, rewards: 0.6720\n",
      "Iteration: 1260, Train loss: -0.5657, rewards: 0.7137\n",
      "Iteration: 1270, Train loss: -0.6716, rewards: 0.6648\n",
      "Iteration: 1280, Train loss: -0.5868, rewards: 0.7066\n",
      "Iteration: 1290, Train loss: -0.6719, rewards: 0.6598\n",
      "Iteration: 1300, Train loss: -0.5833, rewards: 0.7115\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7792\n",
      "------------------------------------------------------------\n",
      "Iteration: 1310, Train loss: -0.5356, rewards: 0.7146\n",
      "Iteration: 1320, Train loss: -0.6678, rewards: 0.6922\n",
      "Iteration: 1330, Train loss: -0.5759, rewards: 0.7017\n",
      "Iteration: 1340, Train loss: -0.5814, rewards: 0.6706\n",
      "Iteration: 1350, Train loss: -0.5960, rewards: 0.7331\n",
      "Iteration: 1360, Train loss: -0.4990, rewards: 0.7174\n",
      "Iteration: 1370, Train loss: -0.6127, rewards: 0.7078\n",
      "Iteration: 1380, Train loss: -0.6135, rewards: 0.7153\n",
      "Iteration: 1390, Train loss: -0.5956, rewards: 0.7139\n",
      "Iteration: 1400, Train loss: -0.6064, rewards: 0.6869\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7684\n",
      "------------------------------------------------------------\n",
      "Iteration: 1410, Train loss: -0.6495, rewards: 0.6804\n",
      "Iteration: 1420, Train loss: -0.6596, rewards: 0.6582\n",
      "Iteration: 1430, Train loss: -0.6762, rewards: 0.6849\n",
      "Iteration: 1440, Train loss: -0.6011, rewards: 0.7104\n",
      "Iteration: 1450, Train loss: -0.5980, rewards: 0.7080\n",
      "Iteration: 1460, Train loss: -0.6119, rewards: 0.7122\n",
      "Iteration: 1470, Train loss: -0.5948, rewards: 0.7008\n",
      "Iteration: 1480, Train loss: -0.4990, rewards: 0.7365\n",
      "Iteration: 1490, Train loss: -0.5970, rewards: 0.7096\n",
      "Iteration: 1500, Train loss: -0.5782, rewards: 0.6859\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7804\n",
      "------------------------------------------------------------\n",
      "Iteration: 1510, Train loss: -0.6863, rewards: 0.6824\n",
      "Iteration: 1520, Train loss: -0.5411, rewards: 0.6905\n",
      "Iteration: 1530, Train loss: -0.6610, rewards: 0.6848\n",
      "Iteration: 1540, Train loss: -0.5338, rewards: 0.7393\n",
      "Iteration: 1550, Train loss: -0.6492, rewards: 0.6708\n",
      "Iteration: 1560, Train loss: -0.5976, rewards: 0.7132\n",
      "Iteration: 1570, Train loss: -0.5486, rewards: 0.7016\n",
      "Iteration: 1580, Train loss: -0.5723, rewards: 0.7435\n",
      "Iteration: 1590, Train loss: -0.5192, rewards: 0.7340\n",
      "Iteration: 1600, Train loss: -0.5760, rewards: 0.7275\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7874\n",
      "------------------------------------------------------------\n",
      "Iteration: 1610, Train loss: -0.6111, rewards: 0.6813\n",
      "Iteration: 1620, Train loss: -0.5729, rewards: 0.7205\n",
      "Iteration: 1630, Train loss: -0.6187, rewards: 0.7024\n",
      "Iteration: 1640, Train loss: -0.5992, rewards: 0.6927\n",
      "Iteration: 1650, Train loss: -0.5835, rewards: 0.6824\n",
      "Iteration: 1660, Train loss: -0.5725, rewards: 0.6984\n",
      "Iteration: 1670, Train loss: -0.5739, rewards: 0.6898\n",
      "Iteration: 1680, Train loss: -0.6395, rewards: 0.6892\n",
      "Iteration: 1690, Train loss: -0.5684, rewards: 0.7036\n",
      "Iteration: 1700, Train loss: -0.6181, rewards: 0.7174\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7874\n",
      "------------------------------------------------------------\n",
      "Iteration: 1710, Train loss: -0.6131, rewards: 0.7018\n",
      "Iteration: 1720, Train loss: -0.6314, rewards: 0.7144\n",
      "Iteration: 1730, Train loss: -0.4977, rewards: 0.7153\n",
      "Iteration: 1740, Train loss: -0.6251, rewards: 0.6972\n",
      "Iteration: 1750, Train loss: -0.6294, rewards: 0.7240\n",
      "Iteration: 1760, Train loss: -0.5679, rewards: 0.7131\n",
      "Iteration: 1770, Train loss: -0.5636, rewards: 0.7227\n",
      "Iteration: 1780, Train loss: -0.5828, rewards: 0.6995\n",
      "Iteration: 1790, Train loss: -0.6112, rewards: 0.7206\n",
      "Iteration: 1800, Train loss: -0.5823, rewards: 0.6992\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7874\n",
      "------------------------------------------------------------\n",
      "Iteration: 1810, Train loss: -0.6311, rewards: 0.7072\n",
      "Iteration: 1820, Train loss: -0.5282, rewards: 0.6988\n",
      "Iteration: 1830, Train loss: -0.5791, rewards: 0.7067\n",
      "Iteration: 1840, Train loss: -0.6264, rewards: 0.6878\n",
      "Iteration: 1850, Train loss: -0.6136, rewards: 0.6918\n",
      "Iteration: 1860, Train loss: -0.6161, rewards: 0.6862\n",
      "Iteration: 1870, Train loss: -0.6136, rewards: 0.6955\n",
      "Iteration: 1880, Train loss: -0.5841, rewards: 0.6915\n",
      "Iteration: 1890, Train loss: -0.6301, rewards: 0.6709\n",
      "Iteration: 1900, Train loss: -0.6017, rewards: 0.7268\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7809\n",
      "------------------------------------------------------------\n",
      "Iteration: 1910, Train loss: -0.5423, rewards: 0.7356\n",
      "Iteration: 1920, Train loss: -0.4933, rewards: 0.7104\n",
      "Iteration: 1930, Train loss: -0.6440, rewards: 0.6852\n",
      "Iteration: 1940, Train loss: -0.5284, rewards: 0.7298\n",
      "Iteration: 1950, Train loss: -0.5719, rewards: 0.7150\n",
      "Iteration: 1960, Train loss: -0.5072, rewards: 0.7457\n",
      "Iteration: 1970, Train loss: -0.5606, rewards: 0.6875\n",
      "Iteration: 1980, Train loss: -0.5863, rewards: 0.7055\n",
      "Iteration: 1990, Train loss: -0.5920, rewards: 0.7194\n",
      "Iteration: 2000, Train loss: -0.5536, rewards: 0.7229\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7792\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.6250, Hits@3: 0.8393, Hits@10: 0.8750, MRR: 0.7272\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8346938775510205 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-28 23:26:57,938]\u001b[0m Trial 4 finished with value: 0.8346938775510205 and parameters: {'lr': 0.008826998928566232, 'bs': 125, 'b': 0.32150681958726635, 'l': 0.3445807462595228, 'ee': 100}. Best is trial 4 with value: 0.8346938775510205.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.1330, rewards: 0.3185\n",
      "Iteration: 10, Train loss: -0.1078, rewards: 0.4633\n",
      "Iteration: 15, Train loss: -0.4539, rewards: 0.4640\n",
      "Iteration: 20, Train loss: -0.4398, rewards: 0.5325\n",
      "Iteration: 25, Train loss: -0.6021, rewards: 0.5666\n",
      "Iteration: 30, Train loss: -0.4742, rewards: 0.6033\n",
      "Iteration: 35, Train loss: -0.3154, rewards: 0.6404\n",
      "Iteration: 40, Train loss: -0.3689, rewards: 0.6591\n",
      "Iteration: 45, Train loss: -0.2802, rewards: 0.6758\n",
      "Iteration: 50, Train loss: -0.4319, rewards: 0.5297\n",
      "Eval:\n",
      "Hits@1: 0.6495, Hits@3: 0.8041, Hits@10: 0.8247, MRR: 0.7212\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.2800, rewards: 0.5428\n",
      "Iteration: 60, Train loss: -0.2538, rewards: 0.6849\n",
      "Iteration: 65, Train loss: -0.1414, rewards: 0.6501\n",
      "Iteration: 70, Train loss: -0.2675, rewards: 0.7213\n",
      "Iteration: 75, Train loss: -0.1471, rewards: 0.7272\n",
      "Iteration: 80, Train loss: -0.1506, rewards: 0.7310\n",
      "Iteration: 85, Train loss: -0.2639, rewards: 0.6790\n",
      "Iteration: 90, Train loss: -0.2158, rewards: 0.7540\n",
      "Iteration: 95, Train loss: -0.2119, rewards: 0.7328\n",
      "Iteration: 100, Train loss: -0.2379, rewards: 0.6787\n",
      "Eval:\n",
      "Hits@1: 0.7423, Hits@3: 0.7938, Hits@10: 0.8247, MRR: 0.7745\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.2829, rewards: 0.7169\n",
      "Iteration: 110, Train loss: -0.0588, rewards: 0.7537\n",
      "Iteration: 115, Train loss: -0.1420, rewards: 0.7524\n",
      "Iteration: 120, Train loss: -0.1395, rewards: 0.7561\n",
      "Iteration: 125, Train loss: -0.1290, rewards: 0.7158\n",
      "Iteration: 130, Train loss: -0.1711, rewards: 0.6916\n",
      "Iteration: 135, Train loss: -0.2132, rewards: 0.7316\n",
      "Iteration: 140, Train loss: -0.0845, rewards: 0.7490\n",
      "Iteration: 145, Train loss: -0.1662, rewards: 0.7490\n",
      "Iteration: 150, Train loss: -0.3048, rewards: 0.6940\n",
      "Eval:\n",
      "Hits@1: 0.7320, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7686\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.0937, rewards: 0.7336\n",
      "Iteration: 160, Train loss: -0.0919, rewards: 0.7285\n",
      "Iteration: 165, Train loss: -0.1011, rewards: 0.7337\n",
      "Iteration: 170, Train loss: -0.2060, rewards: 0.7607\n",
      "Iteration: 175, Train loss: -0.2031, rewards: 0.7078\n",
      "Iteration: 180, Train loss: -0.2023, rewards: 0.7528\n",
      "Iteration: 185, Train loss: -0.1201, rewards: 0.7106\n",
      "Iteration: 190, Train loss: -0.1539, rewards: 0.6700\n",
      "Iteration: 195, Train loss: -0.1313, rewards: 0.7391\n",
      "Iteration: 200, Train loss: -0.0561, rewards: 0.7346\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7822\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.1278, rewards: 0.7081\n",
      "Iteration: 210, Train loss: -0.2207, rewards: 0.7230\n",
      "Iteration: 215, Train loss: -0.1699, rewards: 0.7596\n",
      "Iteration: 220, Train loss: -0.1459, rewards: 0.7601\n",
      "Iteration: 225, Train loss: -0.1751, rewards: 0.7145\n",
      "Iteration: 230, Train loss: -0.1472, rewards: 0.7193\n",
      "Iteration: 235, Train loss: -0.2189, rewards: 0.6613\n",
      "Iteration: 240, Train loss: -0.1324, rewards: 0.7101\n",
      "Iteration: 245, Train loss: -0.1365, rewards: 0.7539\n",
      "Iteration: 250, Train loss: -0.0989, rewards: 0.7416\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.8144, MRR: 0.7841\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.2104, rewards: 0.7431\n",
      "Iteration: 260, Train loss: -0.1796, rewards: 0.6824\n",
      "Iteration: 265, Train loss: -0.1469, rewards: 0.7421\n",
      "Iteration: 270, Train loss: -0.1856, rewards: 0.7737\n",
      "Iteration: 275, Train loss: -0.2572, rewards: 0.8009\n",
      "Iteration: 280, Train loss: -0.1828, rewards: 0.7694\n",
      "Iteration: 285, Train loss: -0.1854, rewards: 0.7303\n",
      "Iteration: 290, Train loss: -0.1554, rewards: 0.7555\n",
      "Iteration: 295, Train loss: -0.0919, rewards: 0.7539\n",
      "Iteration: 300, Train loss: -0.1211, rewards: 0.7052\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7752\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: -0.1479, rewards: 0.7127\n",
      "Iteration: 310, Train loss: -0.0328, rewards: 0.6988\n",
      "Iteration: 315, Train loss: -0.1383, rewards: 0.7406\n",
      "Iteration: 320, Train loss: -0.2435, rewards: 0.7422\n",
      "Iteration: 325, Train loss: -0.1667, rewards: 0.7501\n",
      "Iteration: 330, Train loss: -0.2017, rewards: 0.7652\n",
      "Iteration: 335, Train loss: -0.1002, rewards: 0.7385\n",
      "Iteration: 340, Train loss: -0.1148, rewards: 0.7746\n",
      "Iteration: 345, Train loss: -0.2286, rewards: 0.7272\n",
      "Iteration: 350, Train loss: -0.1235, rewards: 0.7515\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7938, Hits@10: 0.8041, MRR: 0.7912\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: -0.2071, rewards: 0.7355\n",
      "Iteration: 360, Train loss: -0.1566, rewards: 0.7336\n",
      "Iteration: 365, Train loss: -0.2417, rewards: 0.7624\n",
      "Iteration: 370, Train loss: -0.1820, rewards: 0.7687\n",
      "Iteration: 375, Train loss: -0.2032, rewards: 0.7419\n",
      "Iteration: 380, Train loss: -0.1442, rewards: 0.7200\n",
      "Iteration: 385, Train loss: -0.2354, rewards: 0.7243\n",
      "Iteration: 390, Train loss: -0.0659, rewards: 0.7642\n",
      "Iteration: 395, Train loss: -0.1762, rewards: 0.7418\n",
      "Iteration: 400, Train loss: -0.1796, rewards: 0.7890\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7772\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -0.1107, rewards: 0.7321\n",
      "Iteration: 410, Train loss: -0.0766, rewards: 0.7660\n",
      "Iteration: 415, Train loss: -0.1282, rewards: 0.7222\n",
      "Iteration: 420, Train loss: -0.1554, rewards: 0.7646\n",
      "Iteration: 425, Train loss: -0.1831, rewards: 0.7733\n",
      "Iteration: 430, Train loss: -0.0997, rewards: 0.7815\n",
      "Iteration: 435, Train loss: -0.1075, rewards: 0.7409\n",
      "Iteration: 440, Train loss: -0.1259, rewards: 0.7385\n",
      "Iteration: 445, Train loss: -0.1260, rewards: 0.8113\n",
      "Iteration: 450, Train loss: -0.0509, rewards: 0.7791\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7938, Hits@10: 0.8144, MRR: 0.7916\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: -0.0990, rewards: 0.7639\n",
      "Iteration: 460, Train loss: -0.1531, rewards: 0.7613\n",
      "Iteration: 465, Train loss: -0.1067, rewards: 0.7196\n",
      "Iteration: 470, Train loss: -0.1925, rewards: 0.7687\n",
      "Iteration: 475, Train loss: -0.0804, rewards: 0.7525\n",
      "Iteration: 480, Train loss: -0.0656, rewards: 0.7587\n",
      "Iteration: 485, Train loss: -0.1814, rewards: 0.7193\n",
      "Iteration: 490, Train loss: -0.1630, rewards: 0.6904\n",
      "Iteration: 495, Train loss: -0.0762, rewards: 0.6915\n",
      "Iteration: 500, Train loss: -0.2770, rewards: 0.6991\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7938, Hits@10: 0.8144, MRR: 0.7813\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: -0.1618, rewards: 0.6969\n",
      "Iteration: 510, Train loss: -0.1208, rewards: 0.7246\n",
      "Iteration: 515, Train loss: -0.2011, rewards: 0.7576\n",
      "Iteration: 520, Train loss: -0.1964, rewards: 0.7915\n",
      "Iteration: 525, Train loss: -0.1570, rewards: 0.7887\n",
      "Iteration: 530, Train loss: -0.1484, rewards: 0.7675\n",
      "Iteration: 535, Train loss: -0.1377, rewards: 0.7590\n",
      "Iteration: 540, Train loss: -0.1686, rewards: 0.7637\n",
      "Iteration: 545, Train loss: -0.1591, rewards: 0.7503\n",
      "Iteration: 550, Train loss: -0.2063, rewards: 0.7943\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7938, Hits@10: 0.8144, MRR: 0.7751\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: -0.1856, rewards: 0.7937\n",
      "Iteration: 560, Train loss: -0.0807, rewards: 0.7904\n",
      "Iteration: 565, Train loss: -0.1608, rewards: 0.7616\n",
      "Iteration: 570, Train loss: -0.0672, rewards: 0.7436\n",
      "Iteration: 575, Train loss: -0.1953, rewards: 0.7401\n",
      "Iteration: 580, Train loss: -0.1254, rewards: 0.7834\n",
      "Iteration: 585, Train loss: -0.1822, rewards: 0.7360\n",
      "Iteration: 590, Train loss: -0.1483, rewards: 0.7379\n",
      "Iteration: 595, Train loss: -0.1529, rewards: 0.7493\n",
      "Iteration: 600, Train loss: -0.1747, rewards: 0.7840\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7732, Hits@10: 0.7938, MRR: 0.7718\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -0.2753, rewards: 0.7799\n",
      "Iteration: 610, Train loss: -0.2722, rewards: 0.7412\n",
      "Iteration: 615, Train loss: -0.1888, rewards: 0.7924\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 620, Train loss: -0.2143, rewards: 0.7481\n",
      "Iteration: 625, Train loss: -0.2175, rewards: 0.7470\n",
      "Iteration: 630, Train loss: -0.1943, rewards: 0.7618\n",
      "Iteration: 635, Train loss: -0.1392, rewards: 0.7693\n",
      "Iteration: 640, Train loss: -0.1754, rewards: 0.7572\n",
      "Iteration: 645, Train loss: -0.1976, rewards: 0.7593\n",
      "Iteration: 650, Train loss: -0.0898, rewards: 0.7888\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7938, Hits@10: 0.7938, MRR: 0.7835\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: -0.1533, rewards: 0.7478\n",
      "Iteration: 660, Train loss: -0.1795, rewards: 0.7425\n",
      "Iteration: 665, Train loss: -0.1281, rewards: 0.7394\n",
      "Iteration: 670, Train loss: -0.2166, rewards: 0.5887\n",
      "Iteration: 675, Train loss: -0.0094, rewards: 0.7016\n",
      "Iteration: 680, Train loss: -0.0091, rewards: 0.7221\n",
      "Iteration: 685, Train loss: -0.1320, rewards: 0.7740\n",
      "Iteration: 690, Train loss: -0.1501, rewards: 0.6973\n",
      "Iteration: 695, Train loss: -0.1393, rewards: 0.7470\n",
      "Iteration: 700, Train loss: -0.1590, rewards: 0.7130\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7732\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: -0.1383, rewards: 0.7593\n",
      "Iteration: 710, Train loss: -0.1846, rewards: 0.7336\n",
      "Iteration: 715, Train loss: -0.0917, rewards: 0.7184\n",
      "Iteration: 720, Train loss: -0.2280, rewards: 0.7325\n",
      "Iteration: 725, Train loss: -0.1655, rewards: 0.7431\n",
      "Iteration: 730, Train loss: -0.1121, rewards: 0.7718\n",
      "Iteration: 735, Train loss: -0.1294, rewards: 0.7746\n",
      "Iteration: 740, Train loss: -0.1113, rewards: 0.8109\n",
      "Iteration: 745, Train loss: -0.1489, rewards: 0.7394\n",
      "Iteration: 750, Train loss: -0.2081, rewards: 0.7500\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7710\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.1534, rewards: 0.7739\n",
      "Iteration: 760, Train loss: -0.1527, rewards: 0.7803\n",
      "Iteration: 765, Train loss: -0.0948, rewards: 0.7613\n",
      "Iteration: 770, Train loss: -0.1860, rewards: 0.7636\n",
      "Iteration: 775, Train loss: -0.1966, rewards: 0.7301\n",
      "Iteration: 780, Train loss: -0.1565, rewards: 0.7657\n",
      "Iteration: 785, Train loss: -0.1798, rewards: 0.7481\n",
      "Iteration: 790, Train loss: -0.2454, rewards: 0.7396\n",
      "Iteration: 795, Train loss: -0.1987, rewards: 0.7716\n",
      "Iteration: 800, Train loss: -0.1087, rewards: 0.7978\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7784\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: -0.0606, rewards: 0.8130\n",
      "Iteration: 810, Train loss: -0.0910, rewards: 0.7713\n",
      "Iteration: 815, Train loss: -0.1326, rewards: 0.7491\n",
      "Iteration: 820, Train loss: -0.1049, rewards: 0.7301\n",
      "Iteration: 825, Train loss: -0.1854, rewards: 0.7778\n",
      "Iteration: 830, Train loss: -0.1625, rewards: 0.7473\n",
      "Iteration: 835, Train loss: -0.2017, rewards: 0.7876\n",
      "Iteration: 840, Train loss: -0.1302, rewards: 0.7525\n",
      "Iteration: 845, Train loss: -0.1352, rewards: 0.7445\n",
      "Iteration: 850, Train loss: -0.1741, rewards: 0.7790\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7732, Hits@10: 0.7835, MRR: 0.7706\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: -0.1553, rewards: 0.7928\n",
      "Iteration: 860, Train loss: -0.1417, rewards: 0.7955\n",
      "Iteration: 865, Train loss: -0.1841, rewards: 0.7782\n",
      "Iteration: 870, Train loss: -0.1797, rewards: 0.7884\n",
      "Iteration: 875, Train loss: -0.1674, rewards: 0.7407\n",
      "Iteration: 880, Train loss: -0.1821, rewards: 0.7839\n",
      "Iteration: 885, Train loss: -0.1780, rewards: 0.8018\n",
      "Iteration: 890, Train loss: -0.2014, rewards: 0.7467\n",
      "Iteration: 895, Train loss: -0.1811, rewards: 0.7882\n",
      "Iteration: 900, Train loss: -0.1927, rewards: 0.7503\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7784\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: -0.1861, rewards: 0.7513\n",
      "Iteration: 910, Train loss: -0.2468, rewards: 0.7576\n",
      "Iteration: 915, Train loss: -0.1460, rewards: 0.7663\n",
      "Iteration: 920, Train loss: -0.1170, rewards: 0.7715\n",
      "Iteration: 925, Train loss: -0.1564, rewards: 0.7582\n",
      "Iteration: 930, Train loss: -0.1330, rewards: 0.7699\n",
      "Iteration: 935, Train loss: -0.1405, rewards: 0.7728\n",
      "Iteration: 940, Train loss: -0.2164, rewards: 0.7496\n",
      "Iteration: 945, Train loss: -0.2143, rewards: 0.7610\n",
      "Iteration: 950, Train loss: -0.1907, rewards: 0.7633\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7732\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: -0.1568, rewards: 0.7948\n",
      "Iteration: 960, Train loss: -0.1907, rewards: 0.7818\n",
      "Iteration: 965, Train loss: -0.2081, rewards: 0.8090\n",
      "Iteration: 970, Train loss: -0.1972, rewards: 0.7848\n",
      "Iteration: 975, Train loss: -0.1744, rewards: 0.7578\n",
      "Iteration: 980, Train loss: -0.2024, rewards: 0.7812\n",
      "Iteration: 985, Train loss: -0.1406, rewards: 0.7899\n",
      "Iteration: 990, Train loss: -0.1412, rewards: 0.7761\n",
      "Iteration: 995, Train loss: -0.1257, rewards: 0.7521\n",
      "Iteration: 1000, Train loss: -0.1925, rewards: 0.7710\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7784\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: -0.1488, rewards: 0.7822\n",
      "Iteration: 1010, Train loss: -0.1568, rewards: 0.7493\n",
      "Iteration: 1015, Train loss: -0.2643, rewards: 0.7428\n",
      "Iteration: 1020, Train loss: -0.1690, rewards: 0.7328\n",
      "Iteration: 1025, Train loss: -0.1869, rewards: 0.7248\n",
      "Iteration: 1030, Train loss: -0.1896, rewards: 0.7291\n",
      "Iteration: 1035, Train loss: -0.2017, rewards: 0.7707\n",
      "Iteration: 1040, Train loss: -0.1359, rewards: 0.7348\n",
      "Iteration: 1045, Train loss: -0.1710, rewards: 0.7701\n",
      "Iteration: 1050, Train loss: -0.0473, rewards: 0.7640\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7861\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -0.1834, rewards: 0.7476\n",
      "Iteration: 1060, Train loss: -0.1985, rewards: 0.7903\n",
      "Iteration: 1065, Train loss: -0.2195, rewards: 0.7522\n",
      "Iteration: 1070, Train loss: -0.1847, rewards: 0.7675\n",
      "Iteration: 1075, Train loss: -0.1396, rewards: 0.7697\n",
      "Iteration: 1080, Train loss: -0.2124, rewards: 0.7604\n",
      "Iteration: 1085, Train loss: -0.2401, rewards: 0.7696\n",
      "Iteration: 1090, Train loss: -0.1620, rewards: 0.7755\n",
      "Iteration: 1095, Train loss: -0.1741, rewards: 0.7634\n",
      "Iteration: 1100, Train loss: -0.1610, rewards: 0.7751\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7784\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.1979, rewards: 0.8088\n",
      "Iteration: 1110, Train loss: -0.1626, rewards: 0.7779\n",
      "Iteration: 1115, Train loss: -0.1273, rewards: 0.7852\n",
      "Iteration: 1120, Train loss: -0.1580, rewards: 0.7945\n",
      "Iteration: 1125, Train loss: -0.1728, rewards: 0.7440\n",
      "Iteration: 1130, Train loss: -0.2689, rewards: 0.7928\n",
      "Iteration: 1135, Train loss: -0.1739, rewards: 0.7593\n",
      "Iteration: 1140, Train loss: -0.1484, rewards: 0.7615\n",
      "Iteration: 1145, Train loss: -0.1545, rewards: 0.7351\n",
      "Iteration: 1150, Train loss: -0.0988, rewards: 0.7818\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7784\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: -0.2751, rewards: 0.7673\n",
      "Iteration: 1160, Train loss: -0.1178, rewards: 0.7201\n",
      "Iteration: 1165, Train loss: -0.2308, rewards: 0.7451\n",
      "Iteration: 1170, Train loss: -0.2074, rewards: 0.7836\n",
      "Iteration: 1175, Train loss: -0.1229, rewards: 0.7633\n",
      "Iteration: 1180, Train loss: -0.2102, rewards: 0.7845\n",
      "Iteration: 1185, Train loss: -0.0818, rewards: 0.7110\n",
      "Iteration: 1190, Train loss: -0.0953, rewards: 0.7772\n",
      "Iteration: 1195, Train loss: -0.1275, rewards: 0.8096\n",
      "Iteration: 1200, Train loss: -0.1833, rewards: 0.8142\n",
      "Eval:\n",
      "Hits@1: 0.7732, Hits@3: 0.7938, Hits@10: 0.7938, MRR: 0.7818\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: -0.2109, rewards: 0.7925\n",
      "Iteration: 1210, Train loss: -0.1721, rewards: 0.7967\n",
      "Iteration: 1215, Train loss: -0.1646, rewards: 0.7785\n",
      "Iteration: 1220, Train loss: -0.1444, rewards: 0.7531\n",
      "Iteration: 1225, Train loss: -0.1135, rewards: 0.8082\n",
      "Iteration: 1230, Train loss: -0.1629, rewards: 0.7055\n",
      "Iteration: 1235, Train loss: -0.1749, rewards: 0.7803\n",
      "Iteration: 1240, Train loss: -0.1253, rewards: 0.7557\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1245, Train loss: -0.1966, rewards: 0.7896\n",
      "Iteration: 1250, Train loss: -0.2444, rewards: 0.8261\n",
      "Eval:\n",
      "Hits@1: 0.7938, Hits@3: 0.7938, Hits@10: 0.7938, MRR: 0.7938\n",
      "------------------------------------------------------------\n",
      "Iteration: 1255, Train loss: -0.1925, rewards: 0.8075\n",
      "Iteration: 1260, Train loss: -0.0567, rewards: 0.7913\n",
      "Iteration: 1265, Train loss: -0.1290, rewards: 0.7739\n",
      "Iteration: 1270, Train loss: -0.1985, rewards: 0.7225\n",
      "Iteration: 1275, Train loss: -0.2204, rewards: 0.7639\n",
      "Iteration: 1280, Train loss: -0.1560, rewards: 0.7618\n",
      "Iteration: 1285, Train loss: -0.2216, rewards: 0.7821\n",
      "Iteration: 1290, Train loss: -0.1083, rewards: 0.7625\n",
      "Iteration: 1295, Train loss: -0.1606, rewards: 0.7616\n",
      "Iteration: 1300, Train loss: -0.2020, rewards: 0.7778\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7938, Hits@10: 0.7938, MRR: 0.7887\n",
      "------------------------------------------------------------\n",
      "Iteration: 1305, Train loss: -0.1380, rewards: 0.7612\n",
      "Iteration: 1310, Train loss: -0.2296, rewards: 0.7910\n",
      "Iteration: 1315, Train loss: -0.2199, rewards: 0.8400\n",
      "Iteration: 1320, Train loss: -0.1724, rewards: 0.7691\n",
      "Iteration: 1325, Train loss: -0.1697, rewards: 0.7260\n",
      "Iteration: 1330, Train loss: -0.1972, rewards: 0.7546\n",
      "Iteration: 1335, Train loss: -0.2102, rewards: 0.7873\n",
      "Iteration: 1340, Train loss: -0.1463, rewards: 0.7709\n",
      "Iteration: 1345, Train loss: -0.1806, rewards: 0.7518\n",
      "Iteration: 1350, Train loss: -0.1388, rewards: 0.7130\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7727\n",
      "------------------------------------------------------------\n",
      "Iteration: 1355, Train loss: -0.1848, rewards: 0.7407\n",
      "Iteration: 1360, Train loss: -0.1996, rewards: 0.7236\n",
      "Iteration: 1365, Train loss: -0.2675, rewards: 0.7351\n",
      "Iteration: 1370, Train loss: -0.1617, rewards: 0.7397\n",
      "Iteration: 1375, Train loss: -0.1312, rewards: 0.7604\n",
      "Iteration: 1380, Train loss: -0.1589, rewards: 0.7425\n",
      "Iteration: 1385, Train loss: -0.2203, rewards: 0.7600\n",
      "Iteration: 1390, Train loss: -0.0975, rewards: 0.7166\n",
      "Iteration: 1395, Train loss: -0.1097, rewards: 0.7487\n",
      "Iteration: 1400, Train loss: -0.3002, rewards: 0.8057\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7758\n",
      "------------------------------------------------------------\n",
      "Iteration: 1405, Train loss: -0.1330, rewards: 0.7582\n",
      "Iteration: 1410, Train loss: -0.0962, rewards: 0.7539\n",
      "Iteration: 1415, Train loss: -0.2250, rewards: 0.7725\n",
      "Iteration: 1420, Train loss: -0.2110, rewards: 0.7385\n",
      "Iteration: 1425, Train loss: -0.2485, rewards: 0.7390\n",
      "Iteration: 1430, Train loss: -0.1481, rewards: 0.7248\n",
      "Iteration: 1435, Train loss: -0.1597, rewards: 0.7563\n",
      "Iteration: 1440, Train loss: -0.1331, rewards: 0.7454\n",
      "Iteration: 1445, Train loss: -0.1511, rewards: 0.7363\n",
      "Iteration: 1450, Train loss: -0.1306, rewards: 0.7539\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.8041, MRR: 0.7771\n",
      "------------------------------------------------------------\n",
      "Iteration: 1455, Train loss: -0.2298, rewards: 0.7440\n",
      "Iteration: 1460, Train loss: -0.2054, rewards: 0.7393\n",
      "Iteration: 1465, Train loss: -0.1841, rewards: 0.7487\n",
      "Iteration: 1470, Train loss: -0.1730, rewards: 0.7719\n",
      "Iteration: 1475, Train loss: -0.1371, rewards: 0.7394\n",
      "Iteration: 1480, Train loss: -0.1671, rewards: 0.7669\n",
      "Iteration: 1485, Train loss: -0.2063, rewards: 0.7612\n",
      "Iteration: 1490, Train loss: -0.1743, rewards: 0.7624\n",
      "Iteration: 1495, Train loss: -0.1617, rewards: 0.7658\n",
      "Iteration: 1500, Train loss: -0.1444, rewards: 0.7540\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7758\n",
      "------------------------------------------------------------\n",
      "Iteration: 1505, Train loss: -0.1131, rewards: 0.7757\n",
      "Iteration: 1510, Train loss: -0.1826, rewards: 0.7367\n",
      "Iteration: 1515, Train loss: -0.1286, rewards: 0.7424\n",
      "Iteration: 1520, Train loss: -0.1711, rewards: 0.7712\n",
      "Iteration: 1525, Train loss: -0.1397, rewards: 0.7418\n",
      "Iteration: 1530, Train loss: -0.2476, rewards: 0.7572\n",
      "Iteration: 1535, Train loss: -0.1728, rewards: 0.8049\n",
      "Iteration: 1540, Train loss: -0.2261, rewards: 0.8049\n",
      "Iteration: 1545, Train loss: -0.1942, rewards: 0.7863\n",
      "Iteration: 1550, Train loss: -0.2027, rewards: 0.7585\n",
      "Eval:\n",
      "Hits@1: 0.7835, Hits@3: 0.7938, Hits@10: 0.8041, MRR: 0.7912\n",
      "------------------------------------------------------------\n",
      "Iteration: 1555, Train loss: -0.1879, rewards: 0.7972\n",
      "Iteration: 1560, Train loss: -0.2216, rewards: 0.7904\n",
      "Iteration: 1565, Train loss: -0.1675, rewards: 0.7434\n",
      "Iteration: 1570, Train loss: -0.1300, rewards: 0.7846\n",
      "Iteration: 1575, Train loss: -0.2475, rewards: 0.7546\n",
      "Iteration: 1580, Train loss: -0.1096, rewards: 0.7390\n",
      "Iteration: 1585, Train loss: -0.1804, rewards: 0.7667\n",
      "Iteration: 1590, Train loss: -0.1513, rewards: 0.7333\n",
      "Iteration: 1595, Train loss: -0.1621, rewards: 0.7697\n",
      "Iteration: 1600, Train loss: -0.1480, rewards: 0.7776\n",
      "Eval:\n",
      "Hits@1: 0.7320, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7586\n",
      "------------------------------------------------------------\n",
      "Iteration: 1605, Train loss: -0.1373, rewards: 0.7522\n",
      "Iteration: 1610, Train loss: -0.1983, rewards: 0.7801\n",
      "Iteration: 1615, Train loss: -0.1539, rewards: 0.7901\n",
      "Iteration: 1620, Train loss: -0.1825, rewards: 0.7451\n",
      "Iteration: 1625, Train loss: -0.2793, rewards: 0.7612\n",
      "Iteration: 1630, Train loss: -0.1290, rewards: 0.7806\n",
      "Iteration: 1635, Train loss: -0.1592, rewards: 0.7500\n",
      "Iteration: 1640, Train loss: -0.1350, rewards: 0.7699\n",
      "Iteration: 1645, Train loss: -0.1236, rewards: 0.7279\n",
      "Iteration: 1650, Train loss: -0.1560, rewards: 0.7978\n",
      "Eval:\n",
      "Hits@1: 0.7423, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7637\n",
      "------------------------------------------------------------\n",
      "Iteration: 1655, Train loss: -0.0987, rewards: 0.7287\n",
      "Iteration: 1660, Train loss: -0.1505, rewards: 0.7379\n",
      "Iteration: 1665, Train loss: -0.1330, rewards: 0.7548\n",
      "Iteration: 1670, Train loss: -0.1978, rewards: 0.7509\n",
      "Iteration: 1675, Train loss: -0.2018, rewards: 0.7290\n",
      "Iteration: 1680, Train loss: -0.2487, rewards: 0.7825\n",
      "Iteration: 1685, Train loss: -0.1481, rewards: 0.7834\n",
      "Iteration: 1690, Train loss: -0.1569, rewards: 0.7957\n",
      "Iteration: 1695, Train loss: -0.2124, rewards: 0.7610\n",
      "Iteration: 1700, Train loss: -0.1818, rewards: 0.7358\n",
      "Eval:\n",
      "Hits@1: 0.7423, Hits@3: 0.7732, Hits@10: 0.7938, MRR: 0.7607\n",
      "------------------------------------------------------------\n",
      "Iteration: 1705, Train loss: -0.1458, rewards: 0.7691\n",
      "Iteration: 1710, Train loss: -0.1448, rewards: 0.7349\n",
      "Iteration: 1715, Train loss: -0.1566, rewards: 0.7936\n",
      "Iteration: 1720, Train loss: -0.2068, rewards: 0.7351\n",
      "Iteration: 1725, Train loss: -0.2016, rewards: 0.7685\n",
      "Iteration: 1730, Train loss: -0.1820, rewards: 0.7496\n",
      "Iteration: 1735, Train loss: -0.1375, rewards: 0.7766\n",
      "Iteration: 1740, Train loss: -0.1239, rewards: 0.7675\n",
      "Iteration: 1745, Train loss: -0.1168, rewards: 0.7490\n",
      "Iteration: 1750, Train loss: -0.1556, rewards: 0.7927\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7835, MRR: 0.7646\n",
      "------------------------------------------------------------\n",
      "Iteration: 1755, Train loss: -0.2020, rewards: 0.7793\n",
      "Iteration: 1760, Train loss: -0.2366, rewards: 0.7724\n",
      "Iteration: 1765, Train loss: -0.2694, rewards: 0.7840\n",
      "Iteration: 1770, Train loss: -0.1199, rewards: 0.7988\n",
      "Iteration: 1775, Train loss: -0.1458, rewards: 0.7787\n",
      "Iteration: 1780, Train loss: -0.1835, rewards: 0.7690\n",
      "Iteration: 1785, Train loss: -0.2410, rewards: 0.8061\n",
      "Iteration: 1790, Train loss: -0.1415, rewards: 0.7482\n",
      "Iteration: 1795, Train loss: -0.1612, rewards: 0.7860\n",
      "Iteration: 1800, Train loss: -0.1422, rewards: 0.7803\n",
      "Eval:\n",
      "Hits@1: 0.7629, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7758\n",
      "------------------------------------------------------------\n",
      "Iteration: 1805, Train loss: -0.2055, rewards: 0.7566\n",
      "Iteration: 1810, Train loss: -0.0931, rewards: 0.7831\n",
      "Iteration: 1815, Train loss: -0.1581, rewards: 0.7657\n",
      "Iteration: 1820, Train loss: -0.1254, rewards: 0.7678\n",
      "Iteration: 1825, Train loss: -0.2537, rewards: 0.7939\n",
      "Iteration: 1830, Train loss: -0.1082, rewards: 0.7399\n",
      "Iteration: 1835, Train loss: -0.1745, rewards: 0.7651\n",
      "Iteration: 1840, Train loss: -0.2012, rewards: 0.7919\n",
      "Iteration: 1845, Train loss: -0.2324, rewards: 0.7846\n",
      "Iteration: 1850, Train loss: -0.1153, rewards: 0.7563\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7835, Hits@10: 0.7938, MRR: 0.7682\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1855, Train loss: -0.2331, rewards: 0.7755\n",
      "Iteration: 1860, Train loss: -0.2307, rewards: 0.8104\n",
      "Iteration: 1865, Train loss: -0.1825, rewards: 0.7876\n",
      "Iteration: 1870, Train loss: -0.1626, rewards: 0.7873\n",
      "Iteration: 1875, Train loss: -0.1443, rewards: 0.7606\n",
      "Iteration: 1880, Train loss: -0.1221, rewards: 0.7631\n",
      "Iteration: 1885, Train loss: -0.1626, rewards: 0.7685\n",
      "Iteration: 1890, Train loss: -0.1316, rewards: 0.7815\n",
      "Iteration: 1895, Train loss: -0.2350, rewards: 0.7737\n",
      "Iteration: 1900, Train loss: -0.1458, rewards: 0.7713\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7732, Hits@10: 0.7835, MRR: 0.7620\n",
      "------------------------------------------------------------\n",
      "Iteration: 1905, Train loss: -0.1667, rewards: 0.7657\n",
      "Iteration: 1910, Train loss: -0.1917, rewards: 0.7801\n",
      "Iteration: 1915, Train loss: -0.1608, rewards: 0.7590\n",
      "Iteration: 1920, Train loss: -0.1601, rewards: 0.7661\n",
      "Iteration: 1925, Train loss: -0.1743, rewards: 0.7828\n",
      "Iteration: 1930, Train loss: -0.2075, rewards: 0.7778\n",
      "Iteration: 1935, Train loss: -0.1715, rewards: 0.7613\n",
      "Iteration: 1940, Train loss: -0.1935, rewards: 0.7645\n",
      "Iteration: 1945, Train loss: -0.1372, rewards: 0.7506\n",
      "Iteration: 1950, Train loss: -0.2297, rewards: 0.7640\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7732, Hits@10: 0.7938, MRR: 0.7646\n",
      "------------------------------------------------------------\n",
      "Iteration: 1955, Train loss: -0.1559, rewards: 0.7922\n",
      "Iteration: 1960, Train loss: -0.1075, rewards: 0.7521\n",
      "Iteration: 1965, Train loss: -0.1652, rewards: 0.7515\n",
      "Iteration: 1970, Train loss: -0.1350, rewards: 0.7507\n",
      "Iteration: 1975, Train loss: -0.2734, rewards: 0.7831\n",
      "Iteration: 1980, Train loss: -0.1727, rewards: 0.7545\n",
      "Iteration: 1985, Train loss: -0.1730, rewards: 0.8096\n",
      "Iteration: 1990, Train loss: -0.1762, rewards: 0.7533\n",
      "Iteration: 1995, Train loss: -0.1308, rewards: 0.8027\n",
      "Iteration: 2000, Train loss: -0.2048, rewards: 0.8046\n",
      "Eval:\n",
      "Hits@1: 0.7526, Hits@3: 0.7732, Hits@10: 0.7835, MRR: 0.7649\n",
      "------------------------------------------------------------\n",
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "INFO:root:[ printing paths at ./outputs_nell995-1/teamplayssport//test_beam/ ]\n",
      "Hits@1: 0.6518, Hits@3: 0.8839, Hits@10: 0.8929, MRR: 0.7577\n",
      "TeamPlaysSport\n",
      "MINERVA MAP: 0.8584183673469388 (112 queries evaluated)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\u001b[32m[I 2023-03-29 00:10:53,568]\u001b[0m Trial 5 finished with value: 0.8584183673469388 and parameters: {'lr': 0.0038722734103131522, 'bs': 67, 'b': 0.20477733478874321, 'l': 0.37137155998946036, 'ee': 50}. Best is trial 5 with value: 0.8584183673469388.\u001b[0m\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Reading vocab...\n",
      "batcher loaded\n",
      "KG constructed\n",
      "Agent start learning ...\n",
      "Iteration: 5, Train loss: -0.0568, rewards: 0.1323\n",
      "Iteration: 10, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 15, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 20, Train loss: -0.0008, rewards: 0.0000\n",
      "Iteration: 25, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 30, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 35, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 40, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 45, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 50, Train loss: -0.0002, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0515, MRR: 0.0109\n",
      "------------------------------------------------------------\n",
      "Iteration: 55, Train loss: -0.0001, rewards: 0.0057\n",
      "Iteration: 60, Train loss: -0.0001, rewards: 0.0000\n",
      "Iteration: 65, Train loss: -0.0003, rewards: 0.0000\n",
      "Iteration: 70, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 75, Train loss: -0.0010, rewards: 0.0000\n",
      "Iteration: 80, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 85, Train loss: 0.0071, rewards: 0.0020\n",
      "Iteration: 90, Train loss: -0.0012, rewards: 0.0000\n",
      "Iteration: 95, Train loss: -0.0023, rewards: 0.0443\n",
      "Iteration: 100, Train loss: -0.0003, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0103, Hits@10: 0.0206, MRR: 0.0082\n",
      "------------------------------------------------------------\n",
      "Iteration: 105, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 110, Train loss: -0.0000, rewards: 0.0000\n",
      "Iteration: 115, Train loss: -0.0002, rewards: 0.0000\n",
      "Iteration: 120, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 125, Train loss: -0.0005, rewards: 0.0000\n",
      "Iteration: 130, Train loss: -0.0004, rewards: 0.0000\n",
      "Iteration: 135, Train loss: -0.0017, rewards: 0.0000\n",
      "Iteration: 140, Train loss: -0.0027, rewards: 0.0000\n",
      "Iteration: 145, Train loss: -0.0034, rewards: 0.0000\n",
      "Iteration: 150, Train loss: -0.0040, rewards: 0.0000\n",
      "Eval:\n",
      "Hits@1: 0.0000, Hits@3: 0.0000, Hits@10: 0.0000, MRR: 0.0000\n",
      "------------------------------------------------------------\n",
      "Iteration: 155, Train loss: -0.0117, rewards: 0.0000\n",
      "Iteration: 160, Train loss: -0.0469, rewards: 0.0009\n",
      "Iteration: 165, Train loss: -0.0330, rewards: 0.1294\n",
      "Iteration: 170, Train loss: -0.0008, rewards: 0.3466\n",
      "Iteration: 175, Train loss: -0.0201, rewards: 0.5391\n",
      "Iteration: 180, Train loss: 0.0004, rewards: 0.5960\n",
      "Iteration: 185, Train loss: -0.0130, rewards: 0.5711\n",
      "Iteration: 190, Train loss: -0.0160, rewards: 0.6646\n",
      "Iteration: 195, Train loss: -0.0090, rewards: 0.6697\n",
      "Iteration: 200, Train loss: -0.0008, rewards: 0.6166\n",
      "Eval:\n",
      "Hits@1: 0.6495, Hits@3: 0.7732, Hits@10: 0.8454, MRR: 0.7199\n",
      "------------------------------------------------------------\n",
      "Iteration: 205, Train loss: -0.0061, rewards: 0.6086\n",
      "Iteration: 210, Train loss: -0.0094, rewards: 0.7043\n",
      "Iteration: 215, Train loss: -0.0063, rewards: 0.6211\n",
      "Iteration: 220, Train loss: -0.0085, rewards: 0.6303\n",
      "Iteration: 225, Train loss: -0.0024, rewards: 0.7060\n",
      "Iteration: 230, Train loss: 0.0027, rewards: 0.7309\n",
      "Iteration: 235, Train loss: 0.0020, rewards: 0.7240\n",
      "Iteration: 240, Train loss: 0.0175, rewards: 0.7011\n",
      "Iteration: 245, Train loss: -0.0045, rewards: 0.6951\n",
      "Iteration: 250, Train loss: -0.0111, rewards: 0.7246\n",
      "Eval:\n",
      "Hits@1: 0.5876, Hits@3: 0.7629, Hits@10: 0.8454, MRR: 0.6802\n",
      "------------------------------------------------------------\n",
      "Iteration: 255, Train loss: -0.0053, rewards: 0.6686\n",
      "Iteration: 260, Train loss: 0.0055, rewards: 0.6663\n",
      "Iteration: 265, Train loss: -0.0177, rewards: 0.6657\n",
      "Iteration: 270, Train loss: 0.0088, rewards: 0.7066\n",
      "Iteration: 275, Train loss: 0.0101, rewards: 0.6743\n",
      "Iteration: 280, Train loss: 0.0033, rewards: 0.6763\n",
      "Iteration: 285, Train loss: 0.0020, rewards: 0.7137\n",
      "Iteration: 290, Train loss: 0.0127, rewards: 0.5991\n",
      "Iteration: 295, Train loss: -0.0106, rewards: 0.6591\n",
      "Iteration: 300, Train loss: -0.0005, rewards: 0.6554\n",
      "Eval:\n",
      "Hits@1: 0.6701, Hits@3: 0.8144, Hits@10: 0.8351, MRR: 0.7371\n",
      "------------------------------------------------------------\n",
      "Iteration: 305, Train loss: 0.0043, rewards: 0.6511\n",
      "Iteration: 310, Train loss: 0.0006, rewards: 0.6383\n",
      "Iteration: 315, Train loss: 0.0070, rewards: 0.6917\n",
      "Iteration: 320, Train loss: 0.0131, rewards: 0.6403\n",
      "Iteration: 325, Train loss: 0.0099, rewards: 0.6360\n",
      "Iteration: 330, Train loss: -0.0058, rewards: 0.6806\n",
      "Iteration: 335, Train loss: 0.0114, rewards: 0.7237\n",
      "Iteration: 340, Train loss: 0.0096, rewards: 0.6689\n",
      "Iteration: 345, Train loss: 0.0114, rewards: 0.7257\n",
      "Iteration: 350, Train loss: 0.0096, rewards: 0.7677\n",
      "Eval:\n",
      "Hits@1: 0.6082, Hits@3: 0.8041, Hits@10: 0.8351, MRR: 0.7003\n",
      "------------------------------------------------------------\n",
      "Iteration: 355, Train loss: 0.0015, rewards: 0.7157\n",
      "Iteration: 360, Train loss: 0.0223, rewards: 0.6780\n",
      "Iteration: 365, Train loss: 0.0089, rewards: 0.6934\n",
      "Iteration: 370, Train loss: -0.0000, rewards: 0.7257\n",
      "Iteration: 375, Train loss: 0.0130, rewards: 0.6771\n",
      "Iteration: 380, Train loss: 0.0081, rewards: 0.6923\n",
      "Iteration: 385, Train loss: 0.0068, rewards: 0.6689\n",
      "Iteration: 390, Train loss: 0.0019, rewards: 0.6854\n",
      "Iteration: 395, Train loss: 0.0105, rewards: 0.6514\n",
      "Iteration: 400, Train loss: 0.0213, rewards: 0.7337\n",
      "Eval:\n",
      "Hits@1: 0.6289, Hits@3: 0.7732, Hits@10: 0.8454, MRR: 0.7128\n",
      "------------------------------------------------------------\n",
      "Iteration: 405, Train loss: -0.0034, rewards: 0.7054\n",
      "Iteration: 410, Train loss: 0.0137, rewards: 0.6823\n",
      "Iteration: 415, Train loss: 0.0045, rewards: 0.7109\n",
      "Iteration: 420, Train loss: -0.0007, rewards: 0.7706\n",
      "Iteration: 425, Train loss: 0.0005, rewards: 0.7143\n",
      "Iteration: 430, Train loss: 0.0079, rewards: 0.6834\n",
      "Iteration: 435, Train loss: 0.0020, rewards: 0.7471\n",
      "Iteration: 440, Train loss: 0.0112, rewards: 0.7194\n",
      "Iteration: 445, Train loss: 0.0156, rewards: 0.7543\n",
      "Iteration: 450, Train loss: 0.0187, rewards: 0.7200\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8454, MRR: 0.7495\n",
      "------------------------------------------------------------\n",
      "Iteration: 455, Train loss: 0.0149, rewards: 0.6914\n",
      "Iteration: 460, Train loss: 0.0129, rewards: 0.7086\n",
      "Iteration: 465, Train loss: -0.0008, rewards: 0.7146\n",
      "Iteration: 470, Train loss: 0.0143, rewards: 0.7086\n",
      "Iteration: 475, Train loss: 0.0094, rewards: 0.7457\n",
      "Iteration: 480, Train loss: 0.0003, rewards: 0.7417\n",
      "Iteration: 485, Train loss: 0.0045, rewards: 0.7143\n",
      "Iteration: 490, Train loss: -0.0077, rewards: 0.7183\n",
      "Iteration: 495, Train loss: 0.0058, rewards: 0.7720\n",
      "Iteration: 500, Train loss: 0.0066, rewards: 0.6743\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7835, Hits@10: 0.8454, MRR: 0.7435\n",
      "------------------------------------------------------------\n",
      "Iteration: 505, Train loss: 0.0067, rewards: 0.7483\n",
      "Iteration: 510, Train loss: 0.0232, rewards: 0.7140\n",
      "Iteration: 515, Train loss: -0.0016, rewards: 0.7029\n",
      "Iteration: 520, Train loss: 0.0064, rewards: 0.6914\n",
      "Iteration: 525, Train loss: 0.0073, rewards: 0.7200\n",
      "Iteration: 530, Train loss: 0.0005, rewards: 0.6171\n",
      "Iteration: 535, Train loss: 0.0007, rewards: 0.7023\n",
      "Iteration: 540, Train loss: 0.0151, rewards: 0.6857\n",
      "Iteration: 545, Train loss: 0.0163, rewards: 0.7029\n",
      "Iteration: 550, Train loss: 0.0185, rewards: 0.7257\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7629, Hits@10: 0.8351, MRR: 0.7436\n",
      "------------------------------------------------------------\n",
      "Iteration: 555, Train loss: 0.0100, rewards: 0.6794\n",
      "Iteration: 560, Train loss: 0.0182, rewards: 0.7369\n",
      "Iteration: 565, Train loss: 0.0128, rewards: 0.6771\n",
      "Iteration: 570, Train loss: 0.0055, rewards: 0.6514\n",
      "Iteration: 575, Train loss: 0.0067, rewards: 0.6869\n",
      "Iteration: 580, Train loss: 0.0038, rewards: 0.6686\n",
      "Iteration: 585, Train loss: 0.0038, rewards: 0.7371\n",
      "Iteration: 590, Train loss: 0.0123, rewards: 0.7029\n",
      "Iteration: 595, Train loss: 0.0097, rewards: 0.7429\n",
      "Iteration: 600, Train loss: 0.0034, rewards: 0.6506\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7526, Hits@10: 0.8351, MRR: 0.7456\n",
      "------------------------------------------------------------\n",
      "Iteration: 605, Train loss: -0.0018, rewards: 0.7083\n",
      "Iteration: 610, Train loss: 0.0056, rewards: 0.7429\n",
      "Iteration: 615, Train loss: 0.0051, rewards: 0.7486\n",
      "Iteration: 620, Train loss: 0.0022, rewards: 0.7143\n",
      "Iteration: 625, Train loss: 0.0079, rewards: 0.7183\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 630, Train loss: -0.0084, rewards: 0.6743\n",
      "Iteration: 635, Train loss: 0.0048, rewards: 0.7029\n",
      "Iteration: 640, Train loss: 0.0015, rewards: 0.6914\n",
      "Iteration: 645, Train loss: 0.0088, rewards: 0.7540\n",
      "Iteration: 650, Train loss: 0.0121, rewards: 0.6686\n",
      "Eval:\n",
      "Hits@1: 0.7113, Hits@3: 0.7629, Hits@10: 0.8351, MRR: 0.7467\n",
      "------------------------------------------------------------\n",
      "Iteration: 655, Train loss: 0.0070, rewards: 0.7200\n",
      "Iteration: 660, Train loss: 0.0162, rewards: 0.6400\n",
      "Iteration: 665, Train loss: 0.0161, rewards: 0.6797\n",
      "Iteration: 670, Train loss: 0.0052, rewards: 0.7143\n",
      "Iteration: 675, Train loss: 0.0080, rewards: 0.7029\n",
      "Iteration: 680, Train loss: 0.0087, rewards: 0.6914\n",
      "Iteration: 685, Train loss: 0.0129, rewards: 0.6229\n",
      "Iteration: 690, Train loss: -0.0002, rewards: 0.7371\n",
      "Iteration: 695, Train loss: 0.0123, rewards: 0.6800\n",
      "Iteration: 700, Train loss: 0.0105, rewards: 0.6514\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7441\n",
      "------------------------------------------------------------\n",
      "Iteration: 705, Train loss: 0.0076, rewards: 0.7366\n",
      "Iteration: 710, Train loss: 0.0067, rewards: 0.6629\n",
      "Iteration: 715, Train loss: 0.0173, rewards: 0.7486\n",
      "Iteration: 720, Train loss: -0.0124, rewards: 0.6580\n",
      "Iteration: 725, Train loss: 0.0087, rewards: 0.7026\n",
      "Iteration: 730, Train loss: 0.0154, rewards: 0.6857\n",
      "Iteration: 735, Train loss: 0.0182, rewards: 0.6789\n",
      "Iteration: 740, Train loss: -0.0046, rewards: 0.7371\n",
      "Iteration: 745, Train loss: 0.0055, rewards: 0.6226\n",
      "Iteration: 750, Train loss: 0.0155, rewards: 0.6857\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7629, Hits@10: 0.8454, MRR: 0.7366\n",
      "------------------------------------------------------------\n",
      "Iteration: 755, Train loss: -0.0000, rewards: 0.7103\n",
      "Iteration: 760, Train loss: 0.0065, rewards: 0.7257\n",
      "Iteration: 765, Train loss: 0.0150, rewards: 0.7251\n",
      "Iteration: 770, Train loss: -0.0029, rewards: 0.7314\n",
      "Iteration: 775, Train loss: -0.0058, rewards: 0.6800\n",
      "Iteration: 780, Train loss: 0.0019, rewards: 0.7543\n",
      "Iteration: 785, Train loss: -0.0037, rewards: 0.7063\n",
      "Iteration: 790, Train loss: 0.0140, rewards: 0.7543\n",
      "Iteration: 795, Train loss: 0.0004, rewards: 0.6629\n",
      "Iteration: 800, Train loss: -0.0008, rewards: 0.6403\n",
      "Eval:\n",
      "Hits@1: 0.6598, Hits@3: 0.7732, Hits@10: 0.8351, MRR: 0.7250\n",
      "------------------------------------------------------------\n",
      "Iteration: 805, Train loss: 0.0031, rewards: 0.7663\n",
      "Iteration: 810, Train loss: 0.0060, rewards: 0.7314\n",
      "Iteration: 815, Train loss: 0.0021, rewards: 0.7314\n",
      "Iteration: 820, Train loss: 0.0137, rewards: 0.7314\n",
      "Iteration: 825, Train loss: 0.0197, rewards: 0.6686\n",
      "Iteration: 830, Train loss: -0.0008, rewards: 0.7251\n",
      "Iteration: 835, Train loss: -0.0096, rewards: 0.7600\n",
      "Iteration: 840, Train loss: -0.0041, rewards: 0.7783\n",
      "Iteration: 845, Train loss: 0.0260, rewards: 0.7086\n",
      "Iteration: 850, Train loss: -0.0030, rewards: 0.6906\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7732, Hits@10: 0.8247, MRR: 0.7357\n",
      "------------------------------------------------------------\n",
      "Iteration: 855, Train loss: 0.0024, rewards: 0.7543\n",
      "Iteration: 860, Train loss: 0.0077, rewards: 0.7074\n",
      "Iteration: 865, Train loss: -0.0030, rewards: 0.7543\n",
      "Iteration: 870, Train loss: 0.0133, rewards: 0.7143\n",
      "Iteration: 875, Train loss: 0.0011, rewards: 0.6343\n",
      "Iteration: 880, Train loss: 0.0083, rewards: 0.7200\n",
      "Iteration: 885, Train loss: 0.0045, rewards: 0.7340\n",
      "Iteration: 890, Train loss: 0.0036, rewards: 0.7143\n",
      "Iteration: 895, Train loss: 0.0052, rewards: 0.7143\n",
      "Iteration: 900, Train loss: 0.0054, rewards: 0.6686\n",
      "Eval:\n",
      "Hits@1: 0.6804, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7397\n",
      "------------------------------------------------------------\n",
      "Iteration: 905, Train loss: 0.0039, rewards: 0.7143\n",
      "Iteration: 910, Train loss: -0.0050, rewards: 0.7486\n",
      "Iteration: 915, Train loss: 0.0016, rewards: 0.7200\n",
      "Iteration: 920, Train loss: -0.0015, rewards: 0.7257\n",
      "Iteration: 925, Train loss: 0.0132, rewards: 0.6800\n",
      "Iteration: 930, Train loss: 0.0058, rewards: 0.7143\n",
      "Iteration: 935, Train loss: 0.0081, rewards: 0.7714\n",
      "Iteration: 940, Train loss: -0.0031, rewards: 0.7200\n",
      "Iteration: 945, Train loss: -0.0009, rewards: 0.6971\n",
      "Iteration: 950, Train loss: 0.0143, rewards: 0.6400\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7440\n",
      "------------------------------------------------------------\n",
      "Iteration: 955, Train loss: 0.0063, rewards: 0.7314\n",
      "Iteration: 960, Train loss: 0.0141, rewards: 0.7086\n",
      "Iteration: 965, Train loss: 0.0022, rewards: 0.6457\n",
      "Iteration: 970, Train loss: 0.0060, rewards: 0.7829\n",
      "Iteration: 975, Train loss: -0.0053, rewards: 0.6743\n",
      "Iteration: 980, Train loss: 0.0081, rewards: 0.7086\n",
      "Iteration: 985, Train loss: 0.0182, rewards: 0.7714\n",
      "Iteration: 990, Train loss: 0.0076, rewards: 0.6914\n",
      "Iteration: 995, Train loss: 0.0130, rewards: 0.7186\n",
      "Iteration: 1000, Train loss: 0.0165, rewards: 0.7029\n",
      "Eval:\n",
      "Hits@1: 0.7010, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7495\n",
      "------------------------------------------------------------\n",
      "Iteration: 1005, Train loss: 0.0005, rewards: 0.6989\n",
      "Iteration: 1010, Train loss: 0.0052, rewards: 0.7714\n",
      "Iteration: 1015, Train loss: 0.0013, rewards: 0.7029\n",
      "Iteration: 1020, Train loss: 0.0094, rewards: 0.7143\n",
      "Iteration: 1025, Train loss: 0.0061, rewards: 0.6914\n",
      "Iteration: 1030, Train loss: 0.0024, rewards: 0.6800\n",
      "Iteration: 1035, Train loss: 0.0109, rewards: 0.7086\n",
      "Iteration: 1040, Train loss: 0.0009, rewards: 0.6571\n",
      "Iteration: 1045, Train loss: 0.0195, rewards: 0.7543\n",
      "Iteration: 1050, Train loss: 0.0061, rewards: 0.6914\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7938, Hits@10: 0.8351, MRR: 0.7409\n",
      "------------------------------------------------------------\n",
      "Iteration: 1055, Train loss: -0.0116, rewards: 0.6914\n",
      "Iteration: 1060, Train loss: 0.0068, rewards: 0.6914\n",
      "Iteration: 1065, Train loss: 0.0092, rewards: 0.7029\n",
      "Iteration: 1070, Train loss: 0.0089, rewards: 0.6743\n",
      "Iteration: 1075, Train loss: 0.0193, rewards: 0.6686\n",
      "Iteration: 1080, Train loss: -0.0026, rewards: 0.6743\n",
      "Iteration: 1085, Train loss: 0.0164, rewards: 0.7143\n",
      "Iteration: 1090, Train loss: 0.0173, rewards: 0.7200\n",
      "Iteration: 1095, Train loss: 0.0046, rewards: 0.7257\n",
      "Iteration: 1100, Train loss: 0.0080, rewards: 0.7143\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.8041, Hits@10: 0.8351, MRR: 0.7418\n",
      "------------------------------------------------------------\n",
      "Iteration: 1105, Train loss: -0.0033, rewards: 0.7143\n",
      "Iteration: 1110, Train loss: 0.0021, rewards: 0.6457\n",
      "Iteration: 1115, Train loss: 0.0075, rewards: 0.6629\n",
      "Iteration: 1120, Train loss: -0.0010, rewards: 0.7143\n",
      "Iteration: 1125, Train loss: 0.0150, rewards: 0.7029\n",
      "Iteration: 1130, Train loss: 0.0069, rewards: 0.7371\n",
      "Iteration: 1135, Train loss: 0.0121, rewards: 0.7200\n",
      "Iteration: 1140, Train loss: -0.0039, rewards: 0.7657\n",
      "Iteration: 1145, Train loss: -0.0007, rewards: 0.6514\n",
      "Iteration: 1150, Train loss: -0.0027, rewards: 0.6800\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7835, Hits@10: 0.8351, MRR: 0.7393\n",
      "------------------------------------------------------------\n",
      "Iteration: 1155, Train loss: 0.0039, rewards: 0.7371\n",
      "Iteration: 1160, Train loss: 0.0096, rewards: 0.7200\n",
      "Iteration: 1165, Train loss: -0.0012, rewards: 0.7143\n",
      "Iteration: 1170, Train loss: 0.0089, rewards: 0.7600\n",
      "Iteration: 1175, Train loss: -0.0073, rewards: 0.7086\n",
      "Iteration: 1180, Train loss: 0.0060, rewards: 0.6514\n",
      "Iteration: 1185, Train loss: 0.0028, rewards: 0.7086\n",
      "Iteration: 1190, Train loss: 0.0033, rewards: 0.7600\n",
      "Iteration: 1195, Train loss: 0.0012, rewards: 0.6743\n",
      "Iteration: 1200, Train loss: 0.0061, rewards: 0.6800\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7835, Hits@10: 0.8351, MRR: 0.7393\n",
      "------------------------------------------------------------\n",
      "Iteration: 1205, Train loss: 0.0008, rewards: 0.7829\n",
      "Iteration: 1210, Train loss: 0.0134, rewards: 0.7257\n",
      "Iteration: 1215, Train loss: 0.0096, rewards: 0.6857\n",
      "Iteration: 1220, Train loss: -0.0014, rewards: 0.7429\n",
      "Iteration: 1225, Train loss: 0.0046, rewards: 0.7257\n",
      "Iteration: 1230, Train loss: -0.0005, rewards: 0.7771\n",
      "Iteration: 1235, Train loss: -0.0017, rewards: 0.7486\n",
      "Iteration: 1240, Train loss: -0.0106, rewards: 0.6971\n",
      "Iteration: 1245, Train loss: 0.0021, rewards: 0.6914\n",
      "Iteration: 1250, Train loss: 0.0070, rewards: 0.6800\n",
      "Eval:\n",
      "Hits@1: 0.6907, Hits@3: 0.7835, Hits@10: 0.8351, MRR: 0.7393\n",
      "------------------------------------------------------------\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 1255, Train loss: -0.0045, rewards: 0.6914\n",
      "Iteration: 1260, Train loss: 0.0115, rewards: 0.7543\n",
      "Iteration: 1265, Train loss: -0.0040, rewards: 0.7486\n"
     ]
    }
   ],
   "source": [
    "# Tune hyperparameters for the first sub-task in `sub_tasks_list`.\n",
    "sub_task = sub_tasks_list[0]\n",
    "\n",
    "# Trials are persisted to a per-task SQLite file. `load_if_exists=True` lets a\n",
    "# re-run of this cell (e.g. after a kernel restart or an interrupted search)\n",
    "# resume the stored study instead of raising optuna's DuplicatedStudyError.\n",
    "study = optuna.create_study(\n",
    "    storage=f\"sqlite:///{sub_task}.db\",\n",
    "    study_name=f\"{sub_task}\",\n",
    "    direction='maximize',\n",
    "    load_if_exists=True,\n",
    ")\n",
    "\n",
    "# NOTE(review): `n_trials` is per call to `optimize`, so a resumed study runs up\n",
    "# to 1000 additional trials on top of those already stored -- confirm intended.\n",
    "study.optimize(objective, n_trials=1000)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
