{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Test Notebook\n",
    "!ls"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Specify the file paths for the dataset files\n",
    "users_path = \"../datasets/ml-1m/users.dat\"\n",
    "ratings_path = \"../datasets/ml-1m/ratings.dat\"\n",
    "movies_path = \"../datasets/ml-1m/movies.dat\"\n",
    "\n",
    "\n",
    "# Define column names for each dataset\n",
    "users_cols = ['user_id', 'gender', 'age', 'occupation', 'zip_code']\n",
    "ratings_cols = ['user_id', 'movie_id', 'rating', 'timestamp']\n",
    "movies_cols = ['movie_id', 'title', 'genres']\n",
    "\n",
    "# Load data into Pandas DataFrames\n",
    "users_df = pd.read_csv(users_path, sep='::', header=None, names=users_cols, encoding='latin-1', engine='python')\n",
    "ratings_df = pd.read_csv(ratings_path, sep='::', header=None, names=ratings_cols, encoding='latin-1', engine='python')\n",
    "movies_df = pd.read_csv(movies_path, sep='::', header=None, names=movies_cols, encoding='latin-1', engine='python')\n",
    "\n",
    "# Display the first few rows of each DataFrame\n",
    "print(\"Users DataFrame:\")\n",
    "print(users_df.head())\n",
    "\n",
    "print(\"\\nRatings DataFrame:\")\n",
    "print(ratings_df.head())\n",
    "\n",
    "print(\"\\nMovies DataFrame:\")\n",
    "print(movies_df.head())\n",
    "\n",
    "# Optionally, convert DataFrames to NumPy arrays/matrices\n",
    "users_array = users_df.values\n",
    "ratings_array = ratings_df.values\n",
    "movies_array = movies_df.values\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df = pd.merge(ratings_df, movies_df)[['user_id', 'title', 'rating', 'timestamp']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df[\"user_id\"] = ratings_df[\"user_id\"].astype(str)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "General Dataset Statistics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_user = ratings_df.groupby('user_id').rating.count()\n",
    "ratings_per_item = ratings_df.groupby('title').rating.count()\n",
    "\n",
    "print(f\"Total No. of users: {len(ratings_df.user_id.unique())}\")\n",
    "print(f\"Total No. of items: {len(ratings_df.title.unique())}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max observed rating: {ratings_df.rating.max()}\")\n",
    "print(f\"Min observed rating: {ratings_df.rating.min()}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max no. of user ratings: {ratings_per_user.max()}\")\n",
    "print(f\"Min no. of user ratings: {ratings_per_user.min()}\")\n",
    "print(f\"Median no. of ratings per user: {ratings_per_user.median()}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max no. of item ratings: {ratings_per_item.max()}\")\n",
    "print(f\"Min no. of item ratings: {ratings_per_item.min()}\")\n",
    "print(f\"Median no. of ratings per item: {ratings_per_item.median()}\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lookup = {v: i+1 for i, v in enumerate(ratings_df['user_id'].unique())}\n",
    "user_lookup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "movie_lookup = {v: i+1 for i, v in enumerate(ratings_df['title'].unique())}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df['movie_id'] = ratings_df['title'].map(movie_lookup)\n",
    "ratings_df['user_int'] = ratings_df['user_id'].map(user_lookup)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Popularity Bias check"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_item_rating_tuples = ratings_df[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "\n",
    "class MfDotBias(nn.Module):\n",
    "\n",
    "    def __init__(\n",
    "        self, n_factors, n_users, n_items, ratings_range=[1,5], use_biases=False\n",
    "    ):\n",
    "        super().__init__()\n",
    "        self.bias = use_biases\n",
    "        self.y_range = ratings_range\n",
    "        self.user_embedding = nn.Embedding(n_users+1, n_factors, padding_idx=0)\n",
    "        self.item_embedding = nn.Embedding(n_items+1, n_factors, padding_idx=0)\n",
    "\n",
    "        if use_biases:\n",
    "            self.user_bias = nn.Embedding(n_users+1, 1, padding_idx=0)\n",
    "            self.item_bias = nn.Embedding(n_items+1, 1, padding_idx=0)\n",
    "\n",
    "    def forward(self, inputs):\n",
    "        users, items = inputs\n",
    "        dot = self.user_embedding(users) * self.item_embedding(items)\n",
    "        result = dot.sum(1)\n",
    "        if self.bias:\n",
    "            result = (\n",
    "                result + self.user_bias(users).squeeze() + self.item_bias(items).squeeze()\n",
    "            )\n",
    "\n",
    "        if self.y_range is None:\n",
    "            return result\n",
    "        else:\n",
    "            return (\n",
    "                torch.sigmoid(result) * (self.y_range[1] - self.y_range[0])\n",
    "                + self.y_range[0]\n",
    "            )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from tqdm import tqdm\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(user_item_rating_tuples, dtype=torch.long)\n",
    "#valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "#valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 10  # Adjust as needed\n",
    "n_users = train_users.max().item() + 1\n",
    "print(\"Number of users:\", n_users)\n",
    "n_items = train_items.max().item() + 1\n",
    "print(\"Number of items:\", n_items)\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "print(\"Shape of dataset: \", len(train_dataset))\n",
    "print(\"Length of train loader: \", len(train_loader))\n",
    "# Training loop\n",
    "n_epochs = 10  # Adjust as needed\n",
    "for epoch in range(n_epochs):\n",
    "    model.train()\n",
    "    for batch_users, batch_items, batch_ratings in tqdm(train_loader):\n",
    "        optimizer.zero_grad()\n",
    "        predictions = model((batch_users, batch_items))\n",
    "        loss = criterion(predictions, batch_ratings.float())\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "    # Validation\n",
    "    # model.eval()\n",
    "    # with torch.no_grad():\n",
    "    #     valid_predictions = model((valid_users, valid_items))\n",
    "    #     valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "    print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}') #, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "# Optionally, save the trained model\n",
    "torch.save(model.state_dict(), 'mf_model_unbiased.pth')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.load_state_dict(torch.load('mf_model_unbiased.pth'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create a dictionary to store user-item mappings\n",
    "user_item_dict = {}\n",
    "# Iterate through train_data and collect items for each user\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id.item() not in user_item_dict:\n",
    "        user_item_dict[user_id.item()] = [item_id.item()]\n",
    "    else:\n",
    "        user_item_dict[user_id.item()].append(item_id.item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Testing\n",
    "model.user_embedding(torch.tensor(6041))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.item_embedding(torch.tensor(1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.is_available()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.device_count()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.current_device()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.get_device_name(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from collections import defaultdict\n",
    "ratings_per_item_lookup = defaultdict(int)\n",
    "for item_name, num_ratings in ratings_per_item.items():\n",
    "    item_number = movie_lookup.get(item_name)\n",
    "    if item_number is not None:\n",
    "        ratings_per_item_lookup[item_number] += num_ratings\n",
    "\n",
    "# Convert defaultdict to a regular dictionary\n",
    "ratings_per_item_lookup = dict(ratings_per_item_lookup)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_items_by_ratings = sorted(ratings_per_item_lookup.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "# Create a popularity_dict based on the sorted list\n",
    "popularity_dict = {item: rank for rank, (item, count) in enumerate(sorted_items_by_ratings, start=1)}\n",
    "\n",
    "print(\"Popularity dictionary:\", popularity_dict)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Predicted rating for user 25 on item 5\n",
    "inp = [torch.tensor([25]), torch.tensor([5])]\n",
    "print(model(inp).item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Consider user no. 25\n",
    "predicted_ratings = {index: None for index in range(1, n_items + 1)}\n",
    "for item in range(1, n_items+1):\n",
    "    item_rating = model([torch.tensor([25]), torch.tensor([item])]).item()\n",
    "    predicted_ratings[item] = item_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "count_var = 0\n",
    "top_10_item_names=[]\n",
    "for i in sorted_pred_ratings:\n",
    "    item_id = i[0]\n",
    "    if item_id not in user_item_dict[25]:\n",
    "        count_var+=1\n",
    "        top_10_item_names.append(item_id)\n",
    "    if count_var==10:\n",
    "        break\n",
    "print(top_10_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#See average popularity of initial recommendations\n",
    "#Let's take a random user, say 25\n",
    "total_popularity=0\n",
    "for i in top_10_item_names:\n",
    "    total_popularity+=popularity_dict[i]\n",
    "    #print(popularity_dict[i])\n",
    "print(total_popularity/10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.user_embedding(torch.tensor([25]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendations(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(1, n_items + 1)}\n",
    "    for item in range(1, n_items+1):\n",
    "        dot = user_vector * model.item_embedding(torch.tensor([item]))\n",
    "        result = dot.sum(1)\n",
    "        result = torch.sigmoid(result) * (model.y_range[1] - model.y_range[0]) + model.y_range[0]\n",
    "        # result = (\n",
    "        #     result + user_bias + model.item_bias(torch.tensor([item])).squeeze()\n",
    "        # )\n",
    "        item_rating = result.item()\n",
    "        #item_rating = model([torch.tensor([uid]), torch.tensor([item])]).item()\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_popularity(recommendations):\n",
    "    total_popularity=0\n",
    "    for i in recommendations:\n",
    "        total_popularity+=popularity_dict[i]\n",
    "        #print(popularity_dict[i])\n",
    "    return total_popularity/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#torch.tensor([25]), torch.tensor([5])\n",
    "dot = model.user_embedding(torch.tensor([25])) * model.item_embedding(torch.tensor([5]))\n",
    "result = dot.sum(1)\n",
    "result = torch.sigmoid(result) * (model.y_range[1] - model.y_range[0]) + model.y_range[0]\n",
    "# result = (\n",
    "#     result + model.user_bias(torch.tensor([25])).squeeze() + model.item_bias(torch.tensor([5])).squeeze()\n",
    "# )\n",
    "print(result.item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def calculate_error(user_vector, ratings):\n",
    "#     error_sum = 0\n",
    "#     for item, rating in ratings.items():\n",
    "#         item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "#         error_sum += (torch.dot(user_vector, item_vector) - rating)**2\n",
    "#     return error_sum\n",
    "\n",
    "# def update_user_latent_vector(user_vector, item_vectors, ratings, learning_rate):\n",
    "#     error_sum = 0\n",
    "#     for item, rating in ratings.items():\n",
    "#         item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "#         error_sum += 2 * (torch.dot(user_vector, item_vector) - rating) * item_vector\n",
    "#     gradient = error_sum\n",
    "#     updated_user_vector = user_vector - learning_rate * gradient\n",
    "#     return updated_user_vector\n",
    "\n",
    "# def update_user_vector(user_vector, ratings, learning_rate=0.01, max_iterations=100, convergence_threshold=1e-5):\n",
    "#     prev_error = float('inf')\n",
    "#     for iteration in range(max_iterations):\n",
    "#         error = calculate_error(user_vector, ratings)\n",
    "#         #print(prev_error - error)\n",
    "#         if abs(prev_error - error) < convergence_threshold:\n",
    "#             break\n",
    "        \n",
    "#         user_vector = update_user_latent_vector(user_vector, model.item_embedding, ratings, learning_rate)\n",
    "#         prev_error = error\n",
    "#     return user_vector\n",
    "def calculate_error(user_vector, ratings):\n",
    "    error_sum = 0\n",
    "    for item, rating in ratings.items():\n",
    "        item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "        dot = torch.dot(user_vector, item_vector)\n",
    "        predicted_rating = torch.sigmoid(dot) * (model.y_range[1] - model.y_range[0]) + model.y_range[0]\n",
    "        error_sum += (predicted_rating - rating)**2\n",
    "    return error_sum\n",
    "\n",
    "def update_user_latent_vector(user_vector, item_vectors, ratings, learning_rate):\n",
    "    error_sum = 0\n",
    "    for item, rating in ratings.items():\n",
    "        item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "        dot = torch.dot(user_vector, item_vector)\n",
    "        predicted_rating = torch.sigmoid(dot) * (model.y_range[1] - model.y_range[0]) + model.y_range[0]\n",
    "        error_sum += 2 * (predicted_rating - rating) * torch.sigmoid(dot) * (1 - torch.sigmoid(dot)) * item_vector\n",
    "    gradient = error_sum\n",
    "    updated_user_vector = user_vector - learning_rate * gradient\n",
    "    return updated_user_vector\n",
    "\n",
    "def update_user_vector(user_vector, ratings, learning_rate=0.01, max_iterations=100, convergence_threshold=1e-5):\n",
    "    prev_error = float('inf')\n",
    "    for iteration in range(max_iterations):\n",
    "        error = calculate_error(user_vector, ratings)\n",
    "        if abs(prev_error - error) < convergence_threshold:\n",
    "            break\n",
    "        \n",
    "        user_vector = update_user_latent_vector(user_vector, model.item_embedding, ratings, learning_rate)\n",
    "        prev_error = error\n",
    "    return user_vector\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=25\n",
    "ratings={}\n",
    "already_rated=[]\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id!=uid:\n",
    "        continue\n",
    "    ratings[item_id.item()] = rating.item()\n",
    "    already_rated.append(item_id.item())\n",
    "print(\"Ratings acquired\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Start with uniform choice and positive feedback models\n",
    "#As neither present any systematic user preference, any change in trajectory popularity cannot be attributed to the user.\n",
    "time_max=150\n",
    "avg_popularity=[]\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    avg_popularity.append(get_popularity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, ratings)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_popularity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 25\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Diversity Bias\n",
    "#Basically the same, find the diversity of the recommendation list\n",
    "#What metric do you use for diversity? Distance between the latent representations of items?\n",
    "#1 - cosine_similarity\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "import itertools\n",
    "\n",
    "def compute_diversity(rec_list):\n",
    "    item_embeddings = [model.item_embedding(torch.tensor([item]))[0].detach().numpy() for item in rec_list]\n",
    "    #print(item_embeddings)\n",
    "    cosine_similarities = cosine_similarity(item_embeddings, item_embeddings)\n",
    "    cosine_similarities_flat = cosine_similarities[np.triu_indices(len(rec_list), k=1)]\n",
    "    one_minus_cosine_similarities = 1 - cosine_similarities_flat\n",
    "    # Compute the average\n",
    "    average_diversity = one_minus_cosine_similarities.mean()\n",
    "    return average_diversity\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=25\n",
    "ratings={}\n",
    "already_rated=[]\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id!=uid:\n",
    "        continue\n",
    "    ratings[item_id.item()] = rating.item()\n",
    "    already_rated.append(item_id.item())\n",
    "print(\"Ratings acquired\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "time_max=150\n",
    "diversity=[]\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    diversity.append(compute_diversity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, ratings)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "diversity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 25\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=25\n",
    "ratings={}\n",
    "already_rated=[]\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id!=uid:\n",
    "        continue\n",
    "    ratings[item_id.item()] = rating.item()\n",
    "    already_rated.append(item_id.item())\n",
    "print(\"Ratings acquired\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def full_list_pop(recommendations):\n",
    "    l=[]\n",
    "    for i in recommendations:\n",
    "        l.append(popularity_dict[i])\n",
    "    return l"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Now for popularity-based choice, #sanity check\n",
    "time_max=150\n",
    "avg_popularity=[]\n",
    "alpha = 0.5\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    avg_popularity.append(get_popularity(recommendations))\n",
    "    full_list_popularity=full_list_pop(recommendations)\n",
    "    probabilities = np.exp(alpha) * np.array(full_list_popularity)\n",
    "    probabilities /= probabilities.sum()\n",
    "    chosen_index = np.random.choice(len(full_list_popularity), p=probabilities)\n",
    "    choice_of_item = recommendations[chosen_index]\n",
    "    if popularity_dict[choice_of_item]<=300:\n",
    "        ratings[choice_of_item] = 5\n",
    "    else:\n",
    "        ratings[choice_of_item] = 1\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, ratings)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_popularity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 25 with popularity based choice\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Set the most recent interactions as the test set. Remove users that don't appear in the training set from the test set."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Step 1: Sort ratings by timestamp\n",
    "ratings_sorted = ratings_df.sort_values(by='timestamp')\n",
    "\n",
    "# Step 2: Split dataset into training and validation sets\n",
    "total_ratings = len(ratings_sorted)\n",
    "validation_size = int(0.3 * total_ratings)\n",
    "\n",
    "validation_set = ratings_sorted.tail(validation_size)\n",
    "training_set = ratings_sorted.head(total_ratings - validation_size)\n",
    "\n",
    "train_users = training_set['user_id'].unique()\n",
    "validation_set_filtered = validation_set[validation_set['user_id'].isin(train_users)]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(training_set.user_id.unique())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_user_item_rating_tuples = training_set[['user_int', 'movie_id', 'rating']].values.tolist()\n",
    "valid_user_item_rating_tuples = validation_set_filtered[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(train_user_item_rating_tuples, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 10  # Adjust as needed\n",
    "n_users = max(train_users.max(), valid_users.max()).item() + 1\n",
    "n_items = max(train_items.max(), valid_items.max()).item() + 1\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "\n",
    "# Training loop\n",
    "n_epochs = 20  # Adjust as needed\n",
    "for epoch in range(n_epochs):\n",
    "    model.train()\n",
    "    for batch_users, batch_items, batch_ratings in train_loader:\n",
    "        optimizer.zero_grad()\n",
    "        predictions = model((batch_users, batch_items))\n",
    "        loss = criterion(predictions, batch_ratings.float())\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "    # Validation\n",
    "    model.eval()\n",
    "    with torch.no_grad():\n",
    "        valid_predictions = model((valid_users, valid_items))\n",
    "        valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "    print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "# Optionally, save the trained model\n",
    "torch.save(model.state_dict(), 'mf_model.pth')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Method-2: Mark last n ratings by each user as the test set."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mark_last_n_ratings_as_validation_set(ratings_df, 1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_df = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "median_rating = train_df.rating.median()\n",
    "median_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import math\n",
    "from sklearn.metrics import mean_squared_error, mean_absolute_error\n",
    "\n",
    "predictions = np.array([median_rating]* len(valid_df))\n",
    "\n",
    "mae = mean_absolute_error(valid_df.rating, predictions)\n",
    "mse = mean_squared_error(valid_df.rating, predictions)\n",
    "rmse = math.sqrt(mse)\n",
    "\n",
    "print(f'mae: {mae}')\n",
    "print(f'mse: {mse}')\n",
    "print(f'rmse: {rmse}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_user_item_rating_tuples = train_df[['user_int', 'movie_id', 'rating']].values.tolist()\n",
    "valid_user_item_rating_tuples = valid_df[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(train_user_item_rating_tuples, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 10  # Adjust as needed\n",
    "n_users = max(train_users.max(), valid_users.max()).item() + 1\n",
    "n_items = max(train_items.max(), valid_items.max()).item() + 1\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "\n",
    "# Training loop\n",
    "n_epochs = 20  # Adjust as needed\n",
    "for epoch in range(n_epochs):\n",
    "    model.train()\n",
    "    for batch_users, batch_items, batch_ratings in train_loader:\n",
    "        optimizer.zero_grad()\n",
    "        predictions = model((batch_users, batch_items))\n",
    "        loss = criterion(predictions, batch_ratings.float())\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "    # Validation\n",
    "    model.eval()\n",
    "    with torch.no_grad():\n",
    "        valid_predictions = model((valid_users, valid_items))\n",
    "        valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "    print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "# Optionally, save the trained model\n",
    "torch.save(model.state_dict(), 'mf_model.pth')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Recurrent Recommender Network"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# -*- Encoding:UTF-8 -*-\n",
    "\n",
    "import pandas as pd\n",
    "\n",
    "\n",
    "class Data:\n",
    "    def __init__(self, name='ml-1m'):\n",
    "        self.dataName = name\n",
    "        self.dataPath = \"../datasets/\" + self.dataName + \"/\"\n",
    "        # Static Profile\n",
    "        self.UserInfo = self.getUserInfo()\n",
    "        self.MovieInfo = self.getMovieInfo()\n",
    "\n",
    "        self.data = self.getData()\n",
    "\n",
    "    def getUserInfo(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            userInfoPath = self.dataPath + \"users.dat\"\n",
    "\n",
    "            users_title = ['UserID', 'Gender', 'Age', 'JobID', 'Zip-code']\n",
    "            users = pd.read_table(userInfoPath, sep='::', header=None, names=users_title, engine='python', encoding='latin-1')\n",
    "            users = users.filter(regex='UserID|Gender|Age|JobID')\n",
    "            users_orig = users.values\n",
    "\n",
    "            # 将性别映射到0,1\n",
    "            gender_map = {'F': 0, 'M': 1}\n",
    "            users['Gender'] = users['Gender'].map(gender_map)\n",
    "            # 将年龄组映射到0-6\n",
    "            age_map = {val: idx for idx, val in enumerate(set(users['Age']))}\n",
    "            users['Age'] = users['Age'].map(age_map)\n",
    "\n",
    "            return users\n",
    "\n",
    "    def getMovieInfo(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            movieInfoPath = self.dataPath + \"movies.dat\"\n",
    "\n",
    "            movies_title = ['MovieID', 'Title', 'Genres']\n",
    "            movies = pd.read_table(movieInfoPath, sep='::', header=None, names=movies_title, engine='python', encoding='latin-1')\n",
    "            movies = movies.filter(regex='MovieID|Genres')\n",
    "\n",
    "            #电影类型映射到0-18\n",
    "            genres_set = set()\n",
    "            for val in movies['Genres'].str.split('|'):\n",
    "                genres_set.update(val)\n",
    "            genres2int = {val: idx for idx, val in enumerate(genres_set)}\n",
    "            genres_map = {val: [genres2int[row] for row in val.split('|')] for ii, val in enumerate(set(movies['Genres']))}\n",
    "            movies['Genres'] = movies['Genres'].map(genres_map)\n",
    "\n",
    "            return movies\n",
    "\n",
    "    def getData(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            dataPath = self.dataPath + \"ratings.dat\"\n",
    "\n",
    "            ratings_title = ['UserID', 'MovieID', 'Rating', 'TimeStamp']\n",
    "            ratings = pd.read_table(dataPath, sep='::', header=None, names=ratings_title, engine='python', encoding='latin-1')\n",
    "\n",
    "            data = pd.merge(pd.merge(ratings, self.UserInfo), self.MovieInfo)\n",
    "            data = data.sort_values(by=['TimeStamp'])\n",
    "            #print(data.head())\n",
    "\n",
    "            # Step 1: Sort ratings by timestamp\n",
    "\n",
    "            # Step 2: Split dataset into training and validation sets\n",
    "            total_ratings = len(data)\n",
    "            validation_size = int(0.3 * total_ratings)\n",
    "\n",
    "            validation_set = data.tail(validation_size)\n",
    "            training_set = data.head(total_ratings - validation_size)\n",
    "\n",
    "            \n",
    "            train_users = training_set['UserID'].unique()\n",
    "            validation_set_filtered = validation_set[validation_set['UserID'].isin(train_users)]\n",
    "            \n",
    "            return training_set, validation_set_filtered\n",
    "\n",
    "if __name__ == '__main__':\n",
    "    data = Data()\n",
    "    print(len(data.data))\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# -*- Encoding:UTF-8 -*-\n",
    "\n",
    "import tensorflow.compat.v1 as tf\n",
    "tf.disable_v2_behavior()\n",
    "import numpy as np\n",
    "import sys\n",
    "\n",
    "def main():\n",
    "    model = RRN()\n",
    "    model.run()\n",
    "\n",
    "\n",
    "class RRN:\n",
    "    def __init__(self):\n",
    "        # params parser\n",
    "        self.batch_size = 50\n",
    "        self.n_step = 1\n",
    "        self.lr = 0.01\n",
    "        self.verbose = 100\n",
    "        # Data\n",
    "        dataSet = Data(\"ml-1m\")\n",
    "        a, b = dataSet.data\n",
    "        self.train=a.values\n",
    "        self.valid=b.values\n",
    "        # Model\n",
    "        self.add_placeholder()\n",
    "        self.add_embedding_layer()\n",
    "        self.add_rnn_layer()\n",
    "        self.add_pred_layer()\n",
    "        self.add_loss()\n",
    "        self.add_train_step()\n",
    "        self.init_session()\n",
    "\n",
    "    def add_placeholder(self):\n",
    "        # user placeholder\n",
    "        self.userID = tf.placeholder(tf.int32, shape=[None, 1], name=\"userID\")\n",
    "        # movie placeholder\n",
    "        self.movieID = tf.placeholder(tf.int32, shape=[None, 1], name=\"movieID\")\n",
    "        # target\n",
    "        self.rating = tf.placeholder(tf.float32, shape=[None, 1], name=\"rating\")\n",
    "        # other params\n",
    "        self.dropout = tf.placeholder(tf.float32, name='dropout')\n",
    "\n",
    "    def add_embedding_layer(self):\n",
    "        with tf.name_scope(\"userID_embedding\"):\n",
    "            # user id embedding\n",
    "            uid_onehot = tf.reshape(tf.one_hot(self.userID, 6040), shape=[-1, 6040])\n",
    "            # uid_onehot_rating = tf.multiply(self.rating, uid_onehot)\n",
    "            uid_layer = tf.layers.dense(uid_onehot, units=128, activation=tf.nn.relu)\n",
    "            self.uid_layer = tf.reshape(uid_layer, [-1, self.n_step, 128])\n",
    "\n",
    "        with tf.name_scope(\"movie_embedding\"):\n",
    "            # movie id embedding\n",
    "            mid_onehot = tf.reshape(tf.one_hot(self.movieID, 3952), shape=[-1, 3952])\n",
    "            # mid_onehot_rating = tf.multiply(self.rating, mid_onehot)\n",
    "            mid_layer = tf.layers.dense(mid_onehot, units=128, activation=tf.nn.relu)\n",
    "            self.mid_layer = tf.reshape(mid_layer, shape=[-1, self.n_step, 128])\n",
    "\n",
    "    def add_rnn_layer(self):\n",
    "        with tf.variable_scope(\"user_rnn_cell\"):\n",
    "            userCell = tf.nn.rnn_cell.GRUCell(num_units=128)\n",
    "\n",
    "            userInput = tf.transpose(self.mid_layer, [1, 0, 2])\n",
    "            # userInput = tf.reshape(userInput, [-1, 128])\n",
    "            # userInput = tf.split(userInput, self.n_step, axis=0)\n",
    "\n",
    "            userOutputs, userStates = tf.nn.dynamic_rnn(userCell, userInput, dtype=tf.float32)\n",
    "            self.userOutput = userOutputs[-1]\n",
    "        with tf.variable_scope(\"movie_rnn_cell\"):\n",
    "            movieCell = tf.nn.rnn_cell.GRUCell(num_units=128)\n",
    "\n",
    "            movieInput = tf.transpose(self.uid_layer, [1, 0, 2])\n",
    "            movieOutputs, movieStates = tf.nn.dynamic_rnn(movieCell, movieInput, dtype=tf.float32)\n",
    "            self.movieOutput = movieOutputs[-1]\n",
    "\n",
    "    def add_pred_layer(self):\n",
    "        W = {\n",
    "            'userOutput': tf.Variable(tf.random_normal(shape=[128, 64], stddev=0.1)),\n",
    "            'movieOutput': tf.Variable(tf.random_normal(shape=[128, 64], stddev=0.1))\n",
    "        }\n",
    "        b = {\n",
    "            'userOutput': tf.Variable(tf.random_normal(shape=[64], stddev=0.1)),\n",
    "            'movieOutput': tf.Variable(tf.random_normal(shape=[64], stddev=0.1))\n",
    "        }\n",
    "        userVector = tf.add(tf.matmul(self.userOutput, W['userOutput']), b['userOutput'])\n",
    "        movieVector = tf.add(tf.matmul(self.movieOutput, W['movieOutput']), b['movieOutput'])\n",
    "\n",
    "        self.pred = tf.reduce_sum(tf.multiply(userVector, movieVector), axis=1, keep_dims=True)\n",
    "\n",
    "    def add_loss(self):\n",
    "        losses = tf.losses.mean_squared_error(self.rating, self.pred)\n",
    "        self.loss = tf.reduce_mean(losses)\n",
    "\n",
    "    def add_train_step(self):\n",
    "        optimizer = tf.train.AdamOptimizer(self.lr)\n",
    "        self.train_op = optimizer.minimize(self.loss)\n",
    "\n",
    "    def init_session(self):\n",
    "        self.config = tf.ConfigProto()\n",
    "        self.config.gpu_options.allow_growth = True\n",
    "        self.config.allow_soft_placement = True\n",
    "        self.sess = tf.Session(config=self.config)\n",
    "        self.sess.run(tf.global_variables_initializer())\n",
    "\n",
    "    def run(self):\n",
    "        length = len(self.train)\n",
    "        batches = length // self.batch_size + 1\n",
    "\n",
    "        train_loss = []\n",
    "        valid_loss = []\n",
    "\n",
    "        for i in range(batches):\n",
    "            minIdx = i * self.batch_size\n",
    "            maxIdx = min(length, (i+1) * self.batch_size)\n",
    "            train_batch = self.train[minIdx:maxIdx]\n",
    "            feed_dict_train = self.createFeedDict(train_batch)\n",
    "\n",
    "            tmpLoss = self.sess.run(self.loss, feed_dict=feed_dict_train)\n",
    "            train_loss.append(tmpLoss)\n",
    "\n",
    "            self.sess.run(self.train_op, feed_dict=feed_dict_train)\n",
    "\n",
    "            if i % self.verbose == 0:\n",
    "                sys.stdout.write('\\rTraining: Batch {}/{} - Loss: {:.4f}'.format(\n",
    "                    i, batches, np.sqrt(np.mean(train_loss[-20:]))\n",
    "                ))\n",
    "                sys.stdout.flush()\n",
    "\n",
    "            # Check validation loss every verbose steps\n",
    "            # if i % self.verbose == 0 and i != 0:\n",
    "            #     # Use the entire validation set\n",
    "            #     feed_dict_valid = self.createFeedDict(self.valid)\n",
    "            #     valid_loss_epoch = self.sess.run(self.loss, feed_dict=feed_dict_valid)\n",
    "            #     valid_loss.append(np.sqrt(valid_loss_epoch))\n",
    "\n",
    "            #     sys.stdout.write(' - Validation Loss: {:.4f}'.format(valid_loss[-1]))\n",
    "            #     sys.stdout.flush()\n",
    "\n",
    "        print(\"\\nTraining Finish, Last 2000 batches loss is {}.\".format(\n",
    "            np.sqrt(np.mean(train_loss[-2000:]))\n",
    "        ))\n",
    "        feed_dict_valid = self.createFeedDict(self.valid)\n",
    "        valid_loss_epoch = self.sess.run(self.loss, feed_dict=feed_dict_valid)\n",
    "        print(\"Validation Loss: {:.4f}\".format(np.sqrt(valid_loss_epoch)))\n",
    "\n",
    "    def createFeedDict(self, data, dropout=1.):\n",
    "        userID = []\n",
    "        movieID = []\n",
    "        ratings = []\n",
    "        for i in data:\n",
    "            userID.append([i[0]-1])\n",
    "            movieID.append([i[1]-1])\n",
    "            ratings.append([float(i[2])])\n",
    "        return {\n",
    "            self.userID: np.array(userID),\n",
    "            self.movieID: np.array(movieID),\n",
    "            self.rating: np.array(ratings),\n",
    "            self.dropout: dropout\n",
    "        }\n",
    "\n",
    "\n",
    "if __name__ == '__main__':\n",
    "    main()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
