{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Test Notebook\n",
    "!ls"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Specify the file paths for the dataset files\n",
    "users_path = \"../datasets/ml-1m/users.dat\"\n",
    "ratings_path = \"../datasets/ml-1m/ratings.dat\"\n",
    "movies_path = \"../datasets/ml-1m/movies.dat\"\n",
    "\n",
    "\n",
    "# Define column names for each dataset\n",
    "users_cols = ['user_id', 'gender', 'age', 'occupation', 'zip_code']\n",
    "ratings_cols = ['user_id', 'movie_id', 'rating', 'timestamp']\n",
    "movies_cols = ['movie_id', 'title', 'genres']\n",
    "\n",
    "# Load data into Pandas DataFrames\n",
    "users_df = pd.read_csv(users_path, sep='::', header=None, names=users_cols, encoding='latin-1', engine='python')\n",
    "ratings_df = pd.read_csv(ratings_path, sep='::', header=None, names=ratings_cols, encoding='latin-1', engine='python')\n",
    "movies_df = pd.read_csv(movies_path, sep='::', header=None, names=movies_cols, encoding='latin-1', engine='python')\n",
    "\n",
    "# Display the first few rows of each DataFrame\n",
    "print(\"Users DataFrame:\")\n",
    "print(users_df.head())\n",
    "\n",
    "print(\"\\nRatings DataFrame:\")\n",
    "print(ratings_df.head())\n",
    "\n",
    "print(\"\\nMovies DataFrame:\")\n",
    "print(movies_df.head())\n",
    "\n",
    "# Optionally, convert DataFrames to NumPy arrays/matrices\n",
    "users_array = users_df.values\n",
    "ratings_array = ratings_df.values\n",
    "movies_array = movies_df.values\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df = pd.merge(ratings_df, movies_df)[['user_id', 'title', 'rating', 'timestamp']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df[\"user_id\"] = ratings_df[\"user_id\"].astype(str)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "General Dataset Statistics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_user = ratings_df.groupby('user_id').rating.count()\n",
    "ratings_per_item = ratings_df.groupby('title').rating.count()\n",
    "\n",
    "print(f\"Total No. of users: {len(ratings_df.user_id.unique())}\")\n",
    "print(f\"Total No. of items: {len(ratings_df.title.unique())}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max observed rating: {ratings_df.rating.max()}\")\n",
    "print(f\"Min observed rating: {ratings_df.rating.min()}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max no. of user ratings: {ratings_per_user.max()}\")\n",
    "print(f\"Min no. of user ratings: {ratings_per_user.min()}\")\n",
    "print(f\"Median no. of ratings per user: {ratings_per_user.median()}\")\n",
    "print(\"\\n\")\n",
    "\n",
    "print(f\"Max no. of item ratings: {ratings_per_item.max()}\")\n",
    "print(f\"Min no. of item ratings: {ratings_per_item.min()}\")\n",
    "print(f\"Median no. of ratings per item: {ratings_per_item.median()}\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lookup = {v: i+1 for i, v in enumerate(ratings_df['user_id'].unique())}\n",
    "user_lookup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "movie_lookup = {v: i+1 for i, v in enumerate(ratings_df['title'].unique())}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df['movie_id'] = ratings_df['title'].map(movie_lookup)\n",
    "ratings_df['user_int'] = ratings_df['user_id'].map(user_lookup)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_ratings_per_item = ratings_per_item.sort_values(ascending=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_ratings_per_item[:10] #top 10 most popular items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "plt.figure(figsize=(8, 6))\n",
    "plt.hist(ratings_df['rating'], bins=[0.5, 1.5, 2.5, 3.5, 4.5, 5.5], edgecolor='black', alpha=0.7, rwidth=0.8)\n",
    "plt.title('Distribution of Ratings')\n",
    "plt.xlabel('Rating')\n",
    "plt.ylabel('Number of Ratings')\n",
    "plt.xticks([1, 2, 3, 4, 5])\n",
    "plt.grid(axis='y', linestyle='--', alpha=0.7)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_item = ratings_df['movie_id'].value_counts()\n",
    "\n",
    "# Plot long tail curve\n",
    "plt.figure(figsize=(10, 6))\n",
    "plt.plot(ratings_per_item.values, color='blue', marker='o', linestyle='-', linewidth=2, markersize=5)\n",
    "plt.title('Long Tail Curve: Number of Ratings per Movie')\n",
    "plt.xlabel('Movie Index (sorted by popularity)')\n",
    "plt.ylabel('Number of Ratings')\n",
    "#plt.xscale('log') \n",
    "plt.grid(axis='y', linestyle='--', alpha=0.7)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_user = ratings_df['user_int'].value_counts()\n",
    "\n",
    "plt.figure(figsize=(10, 6))\n",
    "plt.plot(ratings_per_user.values, color='green', marker='o', linestyle='-', linewidth=2, markersize=5)\n",
    "plt.title('Long Tail Curve: Number of Ratings per User')\n",
    "plt.xlabel('User Index (sorted by activity)')\n",
    "plt.ylabel('Number of Ratings')\n",
    "#plt.xscale('log')\n",
    "plt.grid(axis='y', linestyle='--', alpha=0.7)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Popularity Bias check"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_item_rating_tuples = ratings_df[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(ratings_df[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "#model = SVD(biased=False)\n",
    "\n",
    "# # Perform cross-validation\n",
    "# cv_results = cross_validate(model, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# # Print the cross-validation results\n",
    "# for measure in ['test_rmse', 'test_mae']:\n",
    "#     print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "# model.fit(trainset)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from surprise import dump\n",
    "\n",
    "# # Assuming you have already trained a model 'algo'\n",
    "# # Define the file path to save the model\n",
    "# file_path = 'surprise_model_full.dump'\n",
    "\n",
    "# # Save the model\n",
    "# dump.dump(file_path, algo=model)\n",
    "\n",
    "# # You can also save additional data along with the model\n",
    "# # For example, if you want to save the dataset used for training:\n",
    "# # dump.dump(file_path, algo=model, trainset=trainset)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "# Define the file path where the model dump is saved\n",
    "file_path = 'surprise_model_full.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Leave 1 out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )\n",
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df\n",
    "mark_last_n_ratings_as_validation_set(ratings_df, 1)\n",
    "train_df = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(train_df[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "# model_last_item = SVD(biased=False)\n",
    "\n",
    "# Perform cross-validation\n",
    "# cv_results = cross_validate(model_last_item, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# Print the cross-validation results\n",
    "# for measure in ['test_rmse', 'test_mae']:\n",
    "#     print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset1 = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "# model_last_item.fit(trainset1)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from surprise import dump\n",
    "\n",
    "# # Assuming you have already trained a model 'algo'\n",
    "# # Define the file path to save the model\n",
    "# file_path = 'surprise_model_last_item.dump'\n",
    "\n",
    "# # Save the model\n",
    "# dump.dump(file_path, algo=model_last_item)\n",
    "\n",
    "# # You can also save additional data along with the model\n",
    "# # For example, if you want to save the dataset used for training:\n",
    "# # dump.dump(file_path, algo=model, trainset=trainset)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "# Define the file path where the model dump is saved\n",
    "file_path = 'surprise_model_last_item.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model_last_item = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Leave 5 out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )\n",
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df\n",
    "mark_last_n_ratings_as_validation_set(ratings_df, 5)\n",
    "train_df_5 = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df_5 = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(train_df_5[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "# model_last_five = SVD(biased=False)\n",
    "\n",
    "# Perform cross-validation\n",
    "# cv_results = cross_validate(model_last_five, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# # Print the cross-validation results\n",
    "# for measure in ['test_rmse', 'test_mae']:\n",
    "#     print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset5 = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "# model_last_five.fit(trainset5)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from surprise import dump\n",
    "\n",
    "# # Assuming you have already trained a model 'algo'\n",
    "# # Define the file path to save the model\n",
    "# file_path = 'surprise_model_last_five.dump'\n",
    "\n",
    "# # Save the model\n",
    "# dump.dump(file_path, algo=model_last_five)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "# Define the file path where the model dump is saved\n",
    "file_path = 'surprise_model_last_five.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model_last_five = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from surprise import Dataset, Reader\n",
    "# from surprise.model_selection import train_test_split\n",
    "# from surprise import SVD\n",
    "# from surprise import accuracy\n",
    "\n",
    "# # Load the MovieLens 1M dataset\n",
    "# # Make sure to replace 'path/to/movielens-1m/ratings.dat' with the actual path to your MovieLens 1M dataset file\n",
    "# reader = Reader(line_format='user item rating timestamp', sep='::')\n",
    "# data = Dataset.load_from_file('../datasets/ml-1m/ratings.dat', reader)\n",
    "\n",
    "# # Split the dataset into training and testing sets\n",
    "# trainset, testset = train_test_split(data, test_size=0.2)\n",
    "\n",
    "# # Choose the SVD model\n",
    "# model = SVD(biased=False)\n",
    "\n",
    "# # Train the model\n",
    "# model.fit(trainset)\n",
    "\n",
    "# # Make predictions on the test set\n",
    "# predictions = model.test(testset)\n",
    "\n",
    "# # Evaluate the model\n",
    "# accuracy.rmse(predictions)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get the user-item rating matrix from the trainset\n",
    "user_item_matrix = trainset.ur\n",
    "total_triplets = sum(len(items) for items in user_item_matrix.values())\n",
    "\n",
    "print(\"Total Triplets:\", total_triplets)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(model.pu)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(model.qi)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# np.save('uservectors', model.pu)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# file = open('items_rated', 'wb')\n",
    "\n",
    "# # dump information to that file\n",
    "# pickle.dump(trainset.ur, file)\n",
    "\n",
    "# # close the file\n",
    "# file.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# np.save('itemvectors', model.qi)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Now to create the same lists we created earlier\n",
    "#already_rated list\n",
    "#popularity ranking list\n",
    "from collections import defaultdict\n",
    "\n",
    "item_occurrences = defaultdict(int)\n",
    "for items in user_item_matrix.values():\n",
    "    for item, _ in items:\n",
    "        item_occurrences[item] += 1\n",
    "\n",
    "# Step 2: Sort items by popularity\n",
    "sorted_items = sorted(item_occurrences.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "# Step 3: Assign ranks to items\n",
    "popularity_rank = {item: rank + 1 for rank, (item, _) in enumerate(sorted_items)}\n",
    "\n",
    "# Print the popularity ranks\n",
    "# for item, rank in popularity_rank.items():\n",
    "#     print(f\"Item {item} has popularity rank {rank}\")\n",
    "sorted_items[:10]\n",
    "#popularity_rank"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "thirty_most_popular = []\n",
    "for i, j in sorted_items[:30]:\n",
    "    thirty_most_popular.append(i)\n",
    "    \n",
    "thirty_least_popular = []\n",
    "for i,j in sorted_items[:-30]:\n",
    "    thirty_least_popular.append(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "user_item_rating_dict = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in user_item_matrix.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# file = open('ui_rating_dict', 'wb')\n",
    "\n",
    "# # dump information to that file\n",
    "# pickle.dump(user_item_rating_dict, file)\n",
    "\n",
    "# # close the file\n",
    "# file.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.shape(model.pu[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.shape(model.qi[1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.dot(model.pu[0],model.qi[1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_items = len(model.qi)\n",
    "n_users = len(model.pu)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendations(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ model.qi[item]\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendation_scores(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ model.qi[item]\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    top_10_item_scores=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        item_score = i[1]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "            top_10_item_scores.append(item_score)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names, top_10_item_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "get_recommendations(model.pu[0], list(user_item_rating_dict[0].keys()))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_popularity(recommendations):\n",
    "    total_popularity=0\n",
    "    for i in recommendations:\n",
    "        total_popularity+=popularity_rank[i]\n",
    "        #print(popularity_dict[i])\n",
    "    return total_popularity/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_vector(user_vector, items, ratings):\n",
    "    Q_list = [model.qi[item] for item in items]\n",
    "    Q = np.array(Q_list)\n",
    "    p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=20"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Start with uniform choice and positive feedback models\n",
    "#As neither present any systematic user preference, any change in trajectory popularity cannot be attributed to the user.\n",
    "from tqdm import tqdm\n",
    "time_max=150\n",
    "avg_popularity=[]\n",
    "user_vector = model.pu[uid]\n",
    "already_rated = list(user_item_rating_dict[uid].keys())\n",
    "ratings = user_item_rating_dict[uid]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    avg_popularity.append(get_popularity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_users"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "popularity_all_users=[]\n",
    "for i in tqdm(range(0,200)): #n_users\n",
    "    time_max=150\n",
    "    uid=i\n",
    "    popularity_all_users.append([])\n",
    "    #avg_popularity=[]\n",
    "    user_vector = model.pu[uid]\n",
    "    already_rated = list(user_item_rating_dict[uid].keys())\n",
    "    ratings = user_item_rating_dict[uid]\n",
    "    for timestep in range(1, time_max+1):\n",
    "        recommendations = get_recommendations(user_vector, already_rated)\n",
    "        popularity_all_users[i].append(get_popularity(recommendations))\n",
    "        choice_of_item = recommendations[0]\n",
    "        ratings[choice_of_item] = 5\n",
    "        already_rated.append(choice_of_item)\n",
    "        user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_popularity=[]\n",
    "for i in range(0,150):\n",
    "    curr_sum=sum(popularity_all_users[j][i] for j in range(0,200))/200\n",
    "    avg_popularity.append(curr_sum)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_popularity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#first 200 users\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Diversity Bias\n",
    "#Basically the same, find the diversity of the recommendation list\n",
    "#What metric do you use for diversity? Distance between the latent representations of items?\n",
    "#1 - cosine_similarity\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "import itertools\n",
    "\n",
    "def compute_diversity(rec_list):\n",
    "    item_embeddings = [model.qi[item] for item in rec_list]\n",
    "    #print(item_embeddings)\n",
    "    cosine_similarities = cosine_similarity(item_embeddings, item_embeddings)\n",
    "    cosine_similarities_flat = cosine_similarities[np.triu_indices(len(rec_list), k=1)]\n",
    "    one_minus_cosine_similarities = 1 - cosine_similarities_flat\n",
    "    # Compute the average\n",
    "    average_diversity = one_minus_cosine_similarities.mean()\n",
    "    return average_diversity\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "diversity_popular = compute_diversity(thirty_most_popular)\n",
    "diversity_unpopular = compute_diversity(thirty_least_popular)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "overall_diversity = compute_diversity(list(item_occurrences.keys()))\n",
    "print(\"Overall Diversity:\", overall_diversity)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(\"Diversity among most popular items:\", diversity_popular)\n",
    "print(\"Diversity among least popular items:\", diversity_unpopular)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from tqdm import tqdm\n",
    "diversity_per_popular = [] #after every 30 items\n",
    "for i in tqdm(range(30, n_items, 30)):\n",
    "    diversity_per_popular.append(compute_diversity([sorted_items[:i][j][0] for j in range(i)]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#plot for diversity as you increase the field of items, starting from the 30 most popular items\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "x_data = [i+1 for i in range(len(diversity_per_popular))]\n",
    "x_data = [i*30 for i in x_data]\n",
    "plt.plot(x_data, diversity_per_popular, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('k')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity of Top-k items by Popularity')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "diversity_all_users=[]\n",
    "for i in tqdm(range(0,200)): #n_users\n",
    "    time_max=150\n",
    "    uid=i\n",
    "    diversity_all_users.append([])\n",
    "    # diversity=[]\n",
    "    user_vector = model.pu[uid]\n",
    "    already_rated = list(user_item_rating_dict[uid].keys())\n",
    "    ratings = user_item_rating_dict[uid]\n",
    "    for timestep in range(1, time_max+1):\n",
    "        recommendations = get_recommendations(user_vector, already_rated)\n",
    "        diversity_all_users[i].append(compute_diversity(recommendations))\n",
    "        choice_of_item = recommendations[0]\n",
    "        ratings[choice_of_item] = 5\n",
    "        already_rated.append(choice_of_item)\n",
    "        user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_diversity=[]\n",
    "for i in range(0,150):\n",
    "    curr_sum=sum(diversity_all_users[j][i] for j in range(0,200))/200\n",
    "    avg_diversity.append(curr_sum)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "uid = 20\n",
    "time_max=150\n",
    "diversity=[]\n",
    "user_vector = model.pu[uid]\n",
    "already_rated = list(user_item_rating_dict[uid].keys())\n",
    "ratings = user_item_rating_dict[uid]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    diversity.append(compute_diversity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "uid = 20\n",
    "time_max=150\n",
    "diversity=[]\n",
    "user_vector = model.pu[uid]\n",
    "already_rated = list(user_item_rating_dict[uid].keys())\n",
    "ratings = user_item_rating_dict[uid]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    diversity.append(compute_diversity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 1\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "diversity_all_users=[]\n",
    "for i in tqdm(range(0,200)): #n_users\n",
    "    time_max=150\n",
    "    uid=i\n",
    "    diversity_all_users.append([])\n",
    "    # diversity=[]\n",
    "    user_vector = model.pu[uid]\n",
    "    already_rated = list(user_item_rating_dict[uid].keys())\n",
    "    ratings = user_item_rating_dict[uid]\n",
    "    for timestep in range(1, time_max+1):\n",
    "        recommendations = get_recommendations(user_vector, already_rated)\n",
    "        diversity_all_users[i].append(compute_diversity(recommendations))\n",
    "        choice_of_item = recommendations[0]\n",
    "        ratings[choice_of_item] = 1\n",
    "        already_rated.append(choice_of_item)\n",
    "        user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_diversity=[]\n",
    "for i in range(0,150):\n",
    "    curr_sum=sum(diversity_all_users[j][i] for j in range(0,200))/200\n",
    "    avg_diversity.append(curr_sum)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Self-Trained Model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "\n",
    "class MfDotBias(nn.Module):\n",
    "\n",
    "    def __init__(\n",
    "        self, n_factors, n_users, n_items, ratings_range=None, use_biases=False\n",
    "    ):\n",
    "        super().__init__()\n",
    "        self.bias = use_biases\n",
    "        self.y_range = ratings_range\n",
    "        self.user_embedding = nn.Embedding(n_users+1, n_factors, padding_idx=0)\n",
    "        self.item_embedding = nn.Embedding(n_items+1, n_factors, padding_idx=0)\n",
    "\n",
    "        if use_biases:\n",
    "            self.user_bias = nn.Embedding(n_users+1, 1, padding_idx=0)\n",
    "            self.item_bias = nn.Embedding(n_items+1, 1, padding_idx=0)\n",
    "\n",
    "    def forward(self, inputs):\n",
    "        users, items = inputs\n",
    "        dot = self.user_embedding(users) * self.item_embedding(items)\n",
    "        result = dot.sum(1)\n",
    "        if self.bias:\n",
    "            result = (\n",
    "                result + self.user_bias(users).squeeze() + self.item_bias(items).squeeze()\n",
    "            )\n",
    "\n",
    "        if self.y_range is None:\n",
    "            return result\n",
    "        else:\n",
    "            return (\n",
    "                torch.sigmoid(result) * (self.y_range[1] - self.y_range[0])\n",
    "                + self.y_range[0]\n",
    "            )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from tqdm import tqdm\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# # Convert datasets to PyTorch tensors\n",
    "# train_data = torch.tensor(user_item_rating_tuples, dtype=torch.long)\n",
    "# valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into training and validation sets\n",
    "train_data, valid_data = train_test_split(user_item_rating_tuples, test_size=0.2, random_state=42)\n",
    "\n",
    "# Convert the lists to PyTorch tensors\n",
    "train_data = torch.tensor(train_data, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_data, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 100  # Adjust as needed\n",
    "n_users = train_users.max().item() + 1\n",
    "print(\"Number of users:\", n_users)\n",
    "n_items = train_items.max().item() + 1\n",
    "print(\"Number of items:\", n_items)\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "print(\"Shape of dataset: \", len(train_dataset))\n",
    "print(\"Length of train loader: \", len(train_loader))\n",
    "# Training loop\n",
    "n_epochs = 20  # Adjust as needed\n",
    "\n",
    "# best_valid_loss = float('inf')\n",
    "# patience = 3  # Adjust as needed\n",
    "# counter = 0\n",
    "\n",
    "# for epoch in range(n_epochs):\n",
    "#     model.train()\n",
    "#     for batch_users, batch_items, batch_ratings in tqdm(train_loader):\n",
    "#         optimizer.zero_grad()\n",
    "#         predictions = model((batch_users, batch_items))\n",
    "#         loss = criterion(predictions, batch_ratings.float())\n",
    "#         loss.backward()\n",
    "#         optimizer.step()\n",
    "\n",
    "#     #Validation\n",
    "#     model.eval()\n",
    "#     with torch.no_grad():\n",
    "#         valid_predictions = model((valid_users, valid_items))\n",
    "#         valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "#     print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "#     if valid_loss < best_valid_loss:\n",
    "#         best_valid_loss = valid_loss\n",
    "#         counter = 0  # Reset counter if validation loss improves\n",
    "#     else:\n",
    "#         counter += 1\n",
    "\n",
    "#     if counter >= patience:\n",
    "#         print(f'Validation loss did not improve for {patience} epochs. Stopping training.')\n",
    "#         break\n",
    "\n",
    "# # Optionally, save the trained model\n",
    "# torch.save(model.state_dict(), 'test_model_1.pth')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.load_state_dict(torch.load('model_50_epochs.pth'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create a dictionary to store user-item mappings\n",
    "user_item_dict = {}\n",
    "# Iterate through train_data and collect items for each user\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id.item() not in user_item_dict:\n",
    "        user_item_dict[user_id.item()] = [item_id.item()]\n",
    "    else:\n",
    "        user_item_dict[user_id.item()].append(item_id.item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Testing\n",
    "model.user_embedding(torch.tensor(6041))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.item_embedding(torch.tensor(1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.is_available()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.device_count()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.current_device()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.get_device_name(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from collections import defaultdict\n",
    "ratings_per_item = defaultdict(int)\n",
    "\n",
    "for item_id in train_items:\n",
    "    ratings_per_item[item_id.item()]+=1\n",
    "    \n",
    "ratings_per_item = dict(ratings_per_item)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_user = defaultdict(int)\n",
    "\n",
    "for user_id in train_users:\n",
    "    ratings_per_user[user_id.item()]+=1\n",
    "    \n",
    "ratings_per_user = dict(ratings_per_user)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from collections import defaultdict\n",
    "# ratings_per_item_lookup = defaultdict(int)\n",
    "# for item_name, num_ratings in ratings_per_item.items():\n",
    "#     item_number = movie_lookup.get(item_name)\n",
    "#     if item_number is not None:\n",
    "#         ratings_per_item_lookup[item_number] += num_ratings\n",
    "\n",
    "# # Convert defaultdict to a regular dictionary\n",
    "# ratings_per_item_lookup = dict(ratings_per_item_lookup)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in ratings_per_item.items():\n",
    "    print(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_items_by_ratings = sorted(ratings_per_item.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "# Create a popularity_dict based on the sorted list\n",
    "popularity_dict = {item: rank for rank, (item, count) in enumerate(sorted_items_by_ratings, start=1)}\n",
    "\n",
    "print(\"Popularity dictionary:\", popularity_dict)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "popularity_list = list(popularity_dict.keys())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Predicted rating for user 25 on item 5\n",
    "inp = [torch.tensor([25]), torch.tensor([5])]\n",
    "print(model(inp).item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Consider user no. 25\n",
    "predicted_ratings = {index: None for index in range(1, n_items + 1)}\n",
    "for item in range(1, n_items+1):\n",
    "    item_rating = model([torch.tensor([25]), torch.tensor([item])]).item()\n",
    "    predicted_ratings[item] = item_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "count_var = 0\n",
    "top_10_item_names=[]\n",
    "for i in sorted_pred_ratings:\n",
    "    item_id = i[0]\n",
    "    if item_id not in user_item_dict[25]:\n",
    "        count_var+=1\n",
    "        top_10_item_names.append(item_id)\n",
    "    if count_var==10:\n",
    "        break\n",
    "print(top_10_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#See average popularity of initial recommendations\n",
    "#Let's take a random user, say 25\n",
    "total_popularity=0\n",
    "for i in top_10_item_names:\n",
    "    total_popularity+=popularity_dict[i]\n",
    "    #print(popularity_dict[i])\n",
    "print(total_popularity/10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.user_embedding(torch.tensor([25]))[0]#.detach().numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_list = []\n",
    "for item in train_items.unique():\n",
    "    item_list.append(item.item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendations(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in item_list}\n",
    "    for item in item_list:\n",
    "        dot = user_vector * model.item_embedding(torch.tensor([item]))\n",
    "        result = dot.sum(1)\n",
    "        # result = (\n",
    "        #     result + model.user_bias(torch.tensor([uid])).squeeze() + model.item_bias(torch.tensor([item])).squeeze()\n",
    "        # )\n",
    "        item_rating = result.item()\n",
    "        #item_rating = model([torch.tensor([uid]), torch.tensor([item])]).item()\n",
    "        predicted_ratings[item] = item_rating\n",
    "    # for i in predicted_ratings:\n",
    "    #     if predicted_ratings[i]==None:\n",
    "    #         print(i)\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendation_scores(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in item_list}\n",
    "    for item in item_list:\n",
    "        dot = user_vector * model.item_embedding(torch.tensor([item]))\n",
    "        result = dot.sum(1)\n",
    "        # result = (\n",
    "        #     result + model.user_bias(torch.tensor([uid])).squeeze() + model.item_bias(torch.tensor([item])).squeeze()\n",
    "        # )\n",
    "        item_rating = result.item()\n",
    "        #item_rating = model([torch.tensor([uid]), torch.tensor([item])]).item()\n",
    "        predicted_ratings[item] = item_rating\n",
    "    # for i in predicted_ratings:\n",
    "    #     if predicted_ratings[i]==None:\n",
    "    #         print(i)\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    top_10_item_scores=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        item_score = i[1]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "            top_10_item_scores.append(item_score)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names, top_10_item_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_popularity(recommendations):\n",
    "    total_popularity=0\n",
    "    for i in recommendations:\n",
    "        total_popularity+=popularity_dict[i]\n",
    "        #print(popularity_dict[i])\n",
    "    return total_popularity/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#torch.tensor([25]), torch.tensor([5])\n",
    "dot = model.user_embedding(torch.tensor([25])) * model.item_embedding(torch.tensor([5]))\n",
    "result = dot.sum(1)\n",
    "# result = (\n",
    "#     result + model.user_bias(torch.tensor([25])).squeeze() + model.item_bias(torch.tensor([5])).squeeze()\n",
    "# )\n",
    "print(result.item())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def calculate_error(user_vector, ratings):\n",
    "#     error_sum = 0\n",
    "#     for item, rating in ratings.items():\n",
    "#         item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "#         error_sum += (torch.dot(user_vector, item_vector) - rating)**2\n",
    "#     return error_sum\n",
    "\n",
    "# def update_user_latent_vector(user_vector, item_vectors, ratings, learning_rate):\n",
    "#     error_sum = 0\n",
    "#     for item, rating in ratings.items():\n",
    "#         item_vector = model.item_embedding(torch.tensor([item]))[0]\n",
    "#         error_sum += 2 * (torch.dot(user_vector, item_vector) - rating) * item_vector\n",
    "#     gradient = error_sum\n",
    "#     updated_user_vector = user_vector - learning_rate * gradient\n",
    "#     return updated_user_vector\n",
    "\n",
    "# def update_user_vector(user_vector, ratings, learning_rate=0.01, max_iterations=100, convergence_threshold=1e-5):\n",
    "#     prev_error = float('inf')\n",
    "#     for iteration in range(max_iterations):\n",
    "#         error = calculate_error(user_vector, ratings)\n",
    "#         #print(prev_error - error)\n",
    "#         if abs(prev_error - error) < convergence_threshold:\n",
    "#             break\n",
    "        \n",
    "#         user_vector = update_user_latent_vector(user_vector, model.item_embedding, ratings, learning_rate)\n",
    "#         prev_error = error\n",
    "#     return user_vector\n",
    "\n",
    "#closed form expression\n",
    "def update_user_vector(user_vector, items, ratings):\n",
    "    Q_list = [model.item_embedding(torch.tensor([item]))[0].detach().numpy() for item in items]\n",
    "    Q = np.array(Q_list)\n",
    "    p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.tensor(p)\n",
    "    return p\n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=25\n",
    "ratings={}\n",
    "already_rated=[]\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id!=uid:\n",
    "        continue\n",
    "    ratings[item_id.item()] = rating.item()\n",
    "    already_rated.append(item_id.item())\n",
    "print(\"Ratings acquired\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#define user_type.choice\n",
    "#define user_type.rating\n",
    "import random\n",
    "class UserType:\n",
    "    def __init__(self, user_type, rec_scores, popularities, beta=0):\n",
    "        self.user_type = user_type\n",
    "        self.rec_scores = rec_scores\n",
    "        self.popularities = popularities\n",
    "        self.beta = beta\n",
    "        self.set_user_type_values()\n",
    "\n",
    "    def set_user_type_values(self):\n",
    "        if self.user_type == \"Enjoyer\":\n",
    "            self.item_choice = 0\n",
    "            self.item_rating = 5\n",
    "        elif self.user_type == \"Hater\":\n",
    "            self.item_choice = 0\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Random Enjoyer\":\n",
    "            self.item_choice = random.randint(0, len(self.rec_scores) - 1)\n",
    "            self.item_rating = 5\n",
    "        elif self.user_type == \"Random Hater\":\n",
    "            self.item_choice = random.randint(0, len(self.rec_scores) - 1)\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Choice Enjoyer\":\n",
    "            # probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            # probabilities /= probabilities.sum() \n",
    "            # self.item_choice = np.random.choice(len(self.rec_scores), p=probabilities)\n",
    "            # self.item_rating = 5\n",
    "            \n",
    "            probabilities = torch.softmax(torch.mul(self.rec_scores, self.beta), dim=0)\n",
    "\n",
    "            # Choose an item based on probabilities\n",
    "            self.item_choice = torch.multinomial(probabilities, 1).item()\n",
    "\n",
    "            # Set item rating to 5\n",
    "            self.item_rating = torch.tensor(5, dtype=torch.float64)\n",
    "        elif self.user_type == \"Choice Hater\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.rec_scores), p=probabilities)\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Popular Enjoyer\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.values), p=probabilities)\n",
    "            if self.popularities[self.item_choice]<500:\n",
    "                self.item_rating = 5\n",
    "            else:\n",
    "                self.item_rating = 1\n",
    "        elif self.user_type == \"Niche Enjoyer\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.values), p=probabilities)\n",
    "            if self.popularities[self.item_choice]<500:\n",
    "                self.item_rating = 1\n",
    "            else:\n",
    "                self.item_rating = 5\n",
    "        else:\n",
    "            raise ValueError(\"Invalid user type. Please choose a valid user type.\")\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Start with uniform choice and positive feedback models\n",
    "#As neither present any systematic user preference, any change in trajectory popularity cannot be attributed to the user.\n",
    "time_max=150\n",
    "avg_popularity=[]\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "    temp_popularity = get_popularity(recommendations)\n",
    "    avg_popularity.append(temp_popularity)\n",
    "    usr_type = UserType(\"Random Enjoyer\", recommendation_scores, temp_popularity)\n",
    "    choice_of_item = recommendations[usr_type.item_choice]\n",
    "    ratings[choice_of_item] = usr_type.item_rating\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Start with uniform choice and positive feedback models\n",
    "#As neither present any systematic user preference, any change in trajectory popularity cannot be attributed to the user.\n",
    "time_max=150\n",
    "avg_popularity=[]\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    avg_popularity.append(get_popularity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "avg_popularity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 25\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 20\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(avg_popularity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Average Popularity')\n",
    "plt.title('Average Popularity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Diversity Bias\n",
    "#Basically the same, find the diversity of the recommendation list\n",
    "#What metric do you use for diversity? Distance between the latent representations of items?\n",
    "#1 - cosine_similarity\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "import itertools\n",
    "\n",
    "def compute_diversity(rec_list):\n",
    "    item_embeddings = [model.item_embedding(torch.tensor([item]))[0].detach().numpy() for item in rec_list]\n",
    "    #print(item_embeddings)\n",
    "    cosine_similarities = cosine_similarity(item_embeddings, item_embeddings)\n",
    "    cosine_similarities_flat = cosine_similarities[np.triu_indices(len(rec_list), k=1)]\n",
    "    one_minus_cosine_similarities = 1 - cosine_similarities_flat\n",
    "    # Compute the average\n",
    "    average_diversity = one_minus_cosine_similarities.mean()\n",
    "    return average_diversity\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "uid=25\n",
    "ratings={}\n",
    "already_rated=[]\n",
    "for user_id, item_id, rating in tqdm(train_data):\n",
    "    if user_id!=uid:\n",
    "        continue\n",
    "    ratings[item_id.item()] = rating.item()\n",
    "    already_rated.append(item_id.item())\n",
    "print(\"Ratings acquired\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Uniform choice and positive feedback\n",
    "#Diversity\n",
    "time_max=150\n",
    "diversity=[]\n",
    "user_vector = model.user_embedding(torch.tensor([uid]))[0]\n",
    "for timestep in tqdm(range(1, time_max+1)):\n",
    "    recommendations = get_recommendations(user_vector, already_rated)\n",
    "    diversity.append(compute_diversity(recommendations))\n",
    "    choice_of_item = recommendations[0]\n",
    "    ratings[choice_of_item] = 5\n",
    "    already_rated.append(choice_of_item)\n",
    "    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "diversity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#User 25\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(diversity, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('Timestep')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity vs. Timestep')\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(popularity_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from tqdm import tqdm\n",
    "diversity_per_popular = [] #after every 30 items\n",
    "for i in tqdm(range(30, len(popularity_list), 30)):\n",
    "    #print(popularity_list[:i])\n",
    "    diversity_per_popular.append(compute_diversity(popularity_list[:i]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#plot for diversity as you increase the field of items, starting from the 30 most popular items\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "x_data = [i+1 for i in range(len(diversity_per_popular))]\n",
    "x_data = [i*30 for i in x_data]\n",
    "plt.plot(x_data, diversity_per_popular, marker='o', linestyle='-', color='b')\n",
    "plt.xlabel('k')\n",
    "plt.ylabel('Diversity')\n",
    "plt.title('Diversity of Top-k items by Popularity')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Set the most recent interactions as the test set. Remove users that don't appear in the training set from the test set."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Step 1: Sort ratings by timestamp\n",
    "ratings_sorted = ratings_df.sort_values(by='timestamp')\n",
    "\n",
    "# Step 2: Split dataset into training and validation sets\n",
    "total_ratings = len(ratings_sorted)\n",
    "validation_size = int(0.3 * total_ratings)\n",
    "\n",
    "validation_set = ratings_sorted.tail(validation_size)\n",
    "training_set = ratings_sorted.head(total_ratings - validation_size)\n",
    "\n",
    "train_users = training_set['user_id'].unique()\n",
    "validation_set_filtered = validation_set[validation_set['user_id'].isin(train_users)]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(training_set.user_id.unique())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_user_item_rating_tuples = training_set[['user_int', 'movie_id', 'rating']].values.tolist()\n",
    "valid_user_item_rating_tuples = validation_set_filtered[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(train_user_item_rating_tuples, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 10  # Adjust as needed\n",
    "n_users = max(train_users.max(), valid_users.max()).item() + 1\n",
    "n_items = max(train_items.max(), valid_items.max()).item() + 1\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "\n",
    "# Training loop\n",
    "n_epochs = 20  # Adjust as needed\n",
    "for epoch in range(n_epochs):\n",
    "    model.train()\n",
    "    for batch_users, batch_items, batch_ratings in train_loader:\n",
    "        optimizer.zero_grad()\n",
    "        predictions = model((batch_users, batch_items))\n",
    "        loss = criterion(predictions, batch_ratings.float())\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "    # Validation\n",
    "    model.eval()\n",
    "    with torch.no_grad():\n",
    "        valid_predictions = model((valid_users, valid_items))\n",
    "        valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "    print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "# Optionally, save the trained model\n",
    "torch.save(model.state_dict(), 'mf_model.pth')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Method-2: Mark last n ratings by each user as the test set."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mark_last_n_ratings_as_validation_set(ratings_df, 1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_df = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "median_rating = train_df.rating.median()\n",
    "median_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import math\n",
    "from sklearn.metrics import mean_squared_error, mean_absolute_error\n",
    "\n",
    "predictions = np.array([median_rating]* len(valid_df))\n",
    "\n",
    "mae = mean_absolute_error(valid_df.rating, predictions)\n",
    "mse = mean_squared_error(valid_df.rating, predictions)\n",
    "rmse = math.sqrt(mse)\n",
    "\n",
    "print(f'mae: {mae}')\n",
    "print(f'mse: {mse}')\n",
    "print(f'rmse: {rmse}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_user_item_rating_tuples = train_df[['user_int', 'movie_id', 'rating']].values.tolist()\n",
    "valid_user_item_rating_tuples = valid_df[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "train_df=train_df[['user_int', 'movie_id', 'rating']]\n",
    "valid_df=valid_df[['user_int', 'movie_id', 'rating']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(train_user_item_rating_tuples, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "from torch.utils.data import DataLoader, TensorDataset\n",
    "from torch.optim import Adam\n",
    "from sklearn.model_selection import train_test_split\n",
    "import numpy as np\n",
    "\n",
    "# Convert datasets to PyTorch tensors\n",
    "train_data = torch.tensor(train_user_item_rating_tuples, dtype=torch.long)\n",
    "valid_data = torch.tensor(valid_user_item_rating_tuples, dtype=torch.long)\n",
    "\n",
    "# Split the data into features (users, items) and targets (ratings)\n",
    "train_users, train_items, train_ratings = train_data[:, 0], train_data[:, 1], train_data[:, 2]\n",
    "valid_users, valid_items, valid_ratings = valid_data[:, 0], valid_data[:, 1], valid_data[:, 2]\n",
    "\n",
    "# Set random seed for reproducibility\n",
    "torch.manual_seed(42)\n",
    "\n",
    "# Instantiate the matrix factorization model\n",
    "n_factors = 10  # Adjust as needed\n",
    "n_users = max(train_users.max(), valid_users.max()).item() + 1\n",
    "n_items = max(train_items.max(), valid_items.max()).item() + 1\n",
    "\n",
    "model = MfDotBias(n_factors=n_factors, n_users=n_users, n_items=n_items)\n",
    "\n",
    "# Define loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = Adam(model.parameters(), lr=0.001)\n",
    "\n",
    "# Convert datasets to DataLoader for batch training\n",
    "batch_size = 64  # Adjust as needed\n",
    "train_dataset = TensorDataset(train_users, train_items, train_ratings)\n",
    "train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)\n",
    "\n",
    "# Training loop\n",
    "n_epochs = 20  # Adjust as needed\n",
    "for epoch in range(n_epochs):\n",
    "    model.train()\n",
    "    for batch_users, batch_items, batch_ratings in train_loader:\n",
    "        optimizer.zero_grad()\n",
    "        predictions = model((batch_users, batch_items))\n",
    "        loss = criterion(predictions, batch_ratings.float())\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "    # Validation\n",
    "    model.eval()\n",
    "    with torch.no_grad():\n",
    "        valid_predictions = model((valid_users, valid_items))\n",
    "        valid_loss = criterion(valid_predictions, valid_ratings.float())\n",
    "\n",
    "    print(f'Epoch {epoch + 1}/{n_epochs}, Loss: {loss.item()}, Validation Loss: {valid_loss.item()}')\n",
    "\n",
    "# Optionally, save the trained model\n",
    "torch.save(model.state_dict(), 'mf_model.pth')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Recurrent Recommender Network"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# -*- Encoding:UTF-8 -*-\n",
    "\n",
    "import pandas as pd\n",
    "\n",
    "\n",
    "class Data:\n",
    "    def __init__(self, name='ml-1m'):\n",
    "        self.dataName = name\n",
    "        self.dataPath = \"../datasets/\" + self.dataName + \"/\"\n",
    "        # Static Profile\n",
    "        self.UserInfo = self.getUserInfo()\n",
    "        self.MovieInfo = self.getMovieInfo()\n",
    "\n",
    "        self.data = self.getData()\n",
    "\n",
    "    def getUserInfo(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            userInfoPath = self.dataPath + \"users.dat\"\n",
    "\n",
    "            users_title = ['UserID', 'Gender', 'Age', 'JobID', 'Zip-code']\n",
    "            users = pd.read_table(userInfoPath, sep='::', header=None, names=users_title, engine='python', encoding='latin-1')\n",
    "            users = users.filter(regex='UserID|Gender|Age|JobID')\n",
    "            users_orig = users.values\n",
    "\n",
    "            gender_map = {'F': 0, 'M': 1}\n",
    "            users['Gender'] = users['Gender'].map(gender_map)\n",
    "            age_map = {val: idx for idx, val in enumerate(set(users['Age']))}\n",
    "            users['Age'] = users['Age'].map(age_map)\n",
    "\n",
    "            return users\n",
    "\n",
    "    def getMovieInfo(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            movieInfoPath = self.dataPath + \"movies.dat\"\n",
    "\n",
    "            movies_title = ['MovieID', 'Title', 'Genres']\n",
    "            movies = pd.read_table(movieInfoPath, sep='::', header=None, names=movies_title, engine='python', encoding='latin-1')\n",
    "            movies = movies.filter(regex='MovieID|Genres')\n",
    "\n",
    "            genres_set = set()\n",
    "            for val in movies['Genres'].str.split('|'):\n",
    "                genres_set.update(val)\n",
    "            genres2int = {val: idx for idx, val in enumerate(genres_set)}\n",
    "            genres_map = {val: [genres2int[row] for row in val.split('|')] for ii, val in enumerate(set(movies['Genres']))}\n",
    "            movies['Genres'] = movies['Genres'].map(genres_map)\n",
    "\n",
    "            return movies\n",
    "\n",
    "    def getData(self):\n",
    "        if self.dataName == \"ml-1m\":\n",
    "            dataPath = self.dataPath + \"ratings.dat\"\n",
    "\n",
    "            ratings_title = ['UserID', 'MovieID', 'Rating', 'TimeStamp']\n",
    "            ratings = pd.read_table(dataPath, sep='::', header=None, names=ratings_title, engine='python', encoding='latin-1')\n",
    "\n",
    "            data = pd.merge(pd.merge(ratings, self.UserInfo), self.MovieInfo)\n",
    "            data = data.sort_values(by=['TimeStamp'])\n",
    "            #print(data.head())\n",
    "\n",
    "            # Step 1: Sort ratings by timestamp\n",
    "\n",
    "            # Step 2: Split dataset into training and validation sets\n",
    "            total_ratings = len(data)\n",
    "            validation_size = int(0.3 * total_ratings)\n",
    "\n",
    "            validation_set = data.tail(validation_size)\n",
    "            training_set = data.head(total_ratings - validation_size)\n",
    "\n",
    "            \n",
    "            train_users = training_set['UserID'].unique()\n",
    "            validation_set_filtered = validation_set[validation_set['UserID'].isin(train_users)]\n",
    "            \n",
    "            return training_set, validation_set_filtered\n",
    "\n",
    "if __name__ == '__main__':\n",
    "    data = Data()\n",
    "    a, b = data.data\n",
    "    print(len(a))\n",
    "    print(len(b))\n",
    "    print(len(data.data))\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# -*- Encoding:UTF-8 -*-\n",
    "\n",
    "import tensorflow.compat.v1 as tf\n",
    "tf.disable_v2_behavior()\n",
    "import numpy as np\n",
    "import sys\n",
    "tf.reset_default_graph()\n",
    "\n",
    "\n",
    "def main():\n",
    "    model = RRN()\n",
    "    model.run()\n",
    "\n",
    "\n",
    "class RRN:\n",
    "    def __init__(self):\n",
    "        # params parser\n",
    "        self.batch_size = 50\n",
    "        self.n_step = 1\n",
    "        self.lr = 0.0001\n",
    "        self.verbose = 100\n",
    "        # Data\n",
    "        dataSet = Data(\"ml-1m\")\n",
    "        a, b = dataSet.data\n",
    "        self.train=a.values\n",
    "        self.valid=b.values\n",
    "        # Model\n",
    "        #wandb.init()\n",
    "        self.add_placeholder()\n",
    "        self.add_embedding_layer()\n",
    "        self.add_rnn_layer()\n",
    "        self.add_pred_layer()\n",
    "        self.add_loss()\n",
    "        self.add_train_step()\n",
    "        self.init_session()\n",
    "        self.saver = tf.train.Saver()\n",
    "        \n",
    "    def save_model(self):\n",
    "        # Save the model\n",
    "        model_path = \"rrn_model_3.ckpt\"\n",
    "        self.saver.save(self.sess, model_path)\n",
    "        print(f\"Model saved at {model_path}\")\n",
    "\n",
    "    def add_placeholder(self):\n",
    "        # user placeholder\n",
    "        self.userID = tf.placeholder(tf.int32, shape=[None, 1], name=\"userID\")\n",
    "        # movie placeholder\n",
    "        self.movieID = tf.placeholder(tf.int32, shape=[None, 1], name=\"movieID\")\n",
    "        # target\n",
    "        self.rating = tf.placeholder(tf.float32, shape=[None, 1], name=\"rating\")\n",
    "        # other params\n",
    "        self.dropout = tf.placeholder(tf.float32, name='dropout')\n",
    "\n",
    "    def add_embedding_layer(self):\n",
    "        with tf.name_scope(\"userID_embedding\"):\n",
    "            # user id embedding\n",
    "            uid_onehot = tf.reshape(tf.one_hot(self.userID, 6040), shape=[-1, 6040])\n",
    "            #print(uid_onehot)\n",
    "            print(\"uid one hot shape\", uid_onehot.get_shape())\n",
    "            # uid_onehot_rating = tf.multiply(self.rating, uid_onehot)\n",
    "            uid_layer = tf.layers.dense(uid_onehot, units=128, activation=tf.nn.relu)\n",
    "            print(\"uid layer shape\", uid_layer.get_shape())\n",
    "            self.uid_layer = tf.reshape(uid_layer, [-1, self.n_step, 128])\n",
    "            print(\"self uid layer shape\", self.uid_layer.get_shape())\n",
    "            #print shape\n",
    "\n",
    "        with tf.name_scope(\"movie_embedding\"):\n",
    "            # movie id embedding\n",
    "            mid_onehot = tf.reshape(tf.one_hot(self.movieID, 3706), shape=[-1, 3706])\n",
    "            # mid_onehot_rating = tf.multiply(self.rating, mid_onehot)\n",
    "            mid_layer = tf.layers.dense(mid_onehot, units=128, activation=tf.nn.relu)\n",
    "            self.mid_layer = tf.reshape(mid_layer, shape=[-1, self.n_step, 128])\n",
    "\n",
    "    def add_rnn_layer(self):\n",
    "        with tf.variable_scope(\"user_rnn_cell\"):\n",
    "            userCell = tf.nn.rnn_cell.GRUCell(num_units=128)\n",
    "\n",
    "            userInput = tf.transpose(self.uid_layer, [1, 0, 2])\n",
    "            print(\"user input shape\", userInput.get_shape())\n",
    "            # userInput = tf.reshape(userInput, [-1, 128])\n",
    "            # userInput = tf.split(userInput, self.n_step, axis=0)\n",
    "\n",
    "            userOutputs, userStates = tf.nn.dynamic_rnn(userCell, userInput, dtype=tf.float32)\n",
    "            self.userOutput = userOutputs[-1]\n",
    "            print(\"self user output shape\", self.userOutput.get_shape())\n",
    "        with tf.variable_scope(\"movie_rnn_cell\"):\n",
    "            movieCell = tf.nn.rnn_cell.GRUCell(num_units=128)\n",
    "\n",
    "            movieInput = tf.transpose(self.mid_layer, [1, 0, 2])\n",
    "            movieOutputs, movieStates = tf.nn.dynamic_rnn(movieCell, movieInput, dtype=tf.float32)\n",
    "            self.movieOutput = movieOutputs[-1]\n",
    "\n",
    "    def add_pred_layer(self):\n",
    "        W = {\n",
    "            'userOutput': tf.Variable(tf.random_normal(shape=[128, 64], stddev=0.1)),\n",
    "            'movieOutput': tf.Variable(tf.random_normal(shape=[128, 64], stddev=0.1))\n",
    "        }\n",
    "        b = {\n",
    "            'userOutput': tf.Variable(tf.random_normal(shape=[64], stddev=0.1)),\n",
    "            'movieOutput': tf.Variable(tf.random_normal(shape=[64], stddev=0.1))\n",
    "        }\n",
    "        userVector = tf.add(tf.matmul(self.userOutput, W['userOutput']), b['userOutput'])\n",
    "        movieVector = tf.add(tf.matmul(self.movieOutput, W['movieOutput']), b['movieOutput'])\n",
    "\n",
    "        self.pred = tf.reduce_sum(tf.multiply(userVector, movieVector), axis=1, keep_dims=True)\n",
    "\n",
    "    def add_loss(self):\n",
    "        losses = tf.losses.mean_squared_error(self.rating, self.pred)\n",
    "        self.loss = tf.reduce_mean(losses)\n",
    "\n",
    "    def add_train_step(self):\n",
    "        optimizer = tf.train.AdamOptimizer(self.lr)\n",
    "        self.train_op = optimizer.minimize(self.loss)\n",
    "\n",
    "    def init_session(self):\n",
    "        self.config = tf.ConfigProto()\n",
    "        self.config.gpu_options.allow_growth = True\n",
    "        self.config.allow_soft_placement = True\n",
    "        self.sess = tf.Session(config=self.config)\n",
    "        self.sess.run(tf.global_variables_initializer())\n",
    "\n",
    "    def run(self):\n",
    "        length = len(self.train)\n",
    "        batches = length // self.batch_size + 1\n",
    "\n",
    "        train_loss = []\n",
    "        valid_loss = []\n",
    "\n",
    "        for i in range(batches):\n",
    "            minIdx = i * self.batch_size\n",
    "            maxIdx = min(length, (i+1) * self.batch_size)\n",
    "            train_batch = self.train[minIdx:maxIdx]\n",
    "            feed_dict_train = self.createFeedDict(train_batch)\n",
    "\n",
    "            tmpLoss = self.sess.run(self.loss, feed_dict=feed_dict_train)\n",
    "            train_loss.append(tmpLoss)\n",
    "\n",
    "            self.sess.run(self.train_op, feed_dict=feed_dict_train)\n",
    "\n",
    "            if i % self.verbose == 0:\n",
    "                sys.stdout.write('\\rTraining: Batch {}/{} - Loss: {:.4f}'.format(\n",
    "                    i, batches, np.sqrt(np.mean(train_loss[-20:]))\n",
    "                ))\n",
    "                sys.stdout.flush()\n",
    "\n",
    "            # Check validation loss every verbose steps\n",
    "            if i % self.verbose == 0 and i != 0:\n",
    "                # Use the entire validation set\n",
    "                feed_dict_valid = self.createFeedDict(self.valid)\n",
    "                valid_loss_epoch = self.sess.run(self.loss, feed_dict=feed_dict_valid)\n",
    "                valid_loss.append(np.sqrt(valid_loss_epoch))\n",
    "                #wandb.log({\"train_loss\": np.sqrt(np.mean(train_loss[-20:])), \"valid_loss\": valid_loss[-1]})\n",
    "\n",
    "                sys.stdout.write(' - Validation Loss: {:.4f}'.format(valid_loss[-1]))\n",
    "                sys.stdout.flush()\n",
    "\n",
    "        print(\"\\nTraining Finish, Last 2000 batches loss is {}.\".format(\n",
    "            np.sqrt(np.mean(train_loss[-2000:]))\n",
    "        ))\n",
    "        feed_dict_valid = self.createFeedDict(self.valid)\n",
    "        valid_loss_epoch = self.sess.run(self.loss, feed_dict=feed_dict_valid)\n",
    "        print(\"Validation Loss: {:.4f}\".format(np.sqrt(valid_loss_epoch)))\n",
    "        self.save_model()\n",
    "\n",
    "    def createFeedDict(self, data, dropout=1.):\n",
    "        userID = []\n",
    "        movieID = []\n",
    "        ratings = []\n",
    "        for i in data:\n",
    "            userID.append([i[0]-1])\n",
    "            movieID.append([i[1]-1])\n",
    "            ratings.append([float(i[2])])\n",
    "        return {\n",
    "            self.userID: np.array(userID),\n",
    "            self.movieID: np.array(movieID),\n",
    "            self.rating: np.array(ratings),\n",
    "            self.dropout: dropout\n",
    "        }\n",
    "\n",
    "if __name__ == '__main__':\n",
    "    main()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import torch.nn.functional as F\n",
    "import pandas as pd\n",
    "from tqdm import tqdm\n",
    "\n",
    "class YourRecommender(nn.Module):\n",
    "    def __init__(self, num_users, num_items, embedding_dim, lambda_reg):\n",
    "        super(YourRecommender, self).__init__()\n",
    "        # Define your model components here, including RNN, embeddings, etc.\n",
    "        # ...\n",
    "\n",
    "        self.embedding_dim = embedding_dim\n",
    "\n",
    "        # User embedding using RNN\n",
    "        self.rnn = nn.GRU(input_size=num_items, hidden_size=embedding_dim, batch_first=True)\n",
    "\n",
    "        # Item embedding\n",
    "        self.item_embedding = nn.Embedding(num_items, embedding_dim)\n",
    "\n",
    "        # Linear layer\n",
    "        self.linear = nn.Linear(embedding_dim, 1)\n",
    "\n",
    "        # Initialize user history vectors\n",
    "        self.user_history = torch.zeros((num_users, num_items), dtype=torch.float32, requires_grad=False)\n",
    "\n",
    "        # Regularization strength\n",
    "        self.lambda_reg = lambda_reg\n",
    "\n",
    "    def forward(self, user, item):\n",
    "        #for user, item in zip(user_seq, item_seq):\n",
    "        self.user_history[user] = self.user_history[user] + F.one_hot(item, num_classes=self.user_history.size(1)).float()\n",
    "\n",
    "        # User embedding using RNN\n",
    "        user_emb, _ = self.rnn(self.user_history[user])\n",
    "\n",
    "        # Item embedding\n",
    "        item_emb = self.item_embedding(item)\n",
    "\n",
    "        # Linear layer\n",
    "        output = torch.matmul(user_emb, item_emb.t())\n",
    "        output = output.squeeze(0)\n",
    "        # output = user_emb * item_emb\n",
    "        # output=torch.sum(output)\n",
    "        #print(output)\n",
    "        return output\n",
    "\n",
    "# Assuming train_data is a pandas DataFrame containing the training data\n",
    "# Columns: ['userId', 'movieId', 'rating', 'timestamp']\n",
    "\n",
    "# Constants\n",
    "num_users = 6040  # Adjust according to your dataset\n",
    "num_items = 3952  # Adjust according to your dataset\n",
    "embedding_dim = 64  # Adjust as needed\n",
    "lambda_reg = 0.001  # Adjust as needed\n",
    "\n",
    "# Initialize your model\n",
    "model = YourRecommender(num_users, num_items, embedding_dim, lambda_reg)\n",
    "\n",
    "# Loss function and optimizer\n",
    "criterion = nn.MSELoss()\n",
    "optimizer = optim.SGD(model.parameters(), lr=0.01)\n",
    "\n",
    "# Training loop\n",
    "num_epochs = 10\n",
    "for epoch in range(num_epochs):\n",
    "    model.train()\n",
    "    train_losses=[]\n",
    "    for _, row in tqdm(train_df.iterrows()):\n",
    "        user_id = row['user_int']\n",
    "        item_id = row['movie_id']\n",
    "        rating = row['rating']\n",
    "\n",
    "        # Convert data to tensors\n",
    "        user_seq = torch.LongTensor([user_id])\n",
    "        item_seq = torch.LongTensor([item_id])\n",
    "        #item_seq_len = torch.LongTensor([1])  # Assuming it's just the current item\n",
    "\n",
    "        # Forward pass\n",
    "        predicted_rating = model(user_seq, item_seq)\n",
    "        #print(predicted_rating)\n",
    "        # Compute loss\n",
    "        loss = criterion(predicted_rating, torch.FloatTensor([rating]))\n",
    "\n",
    "        # Add regularization term\n",
    "        reg_loss = 0.5 * model.lambda_reg * (torch.norm(model.rnn.weight_hh_l0) ** 2 +\n",
    "                                             torch.norm(model.rnn.weight_ih_l0) ** 2)\n",
    "        loss += reg_loss\n",
    "\n",
    "        # Backward and optimize\n",
    "        optimizer.zero_grad()\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "        train_losses.append(loss.item())\n",
    "        \n",
    "    model.eval()\n",
    "    val_losses = []\n",
    "    with torch.no_grad():\n",
    "        for _, val_row in valid_df.iterrows():\n",
    "            val_user_id = val_row['user_int']\n",
    "            val_item_id = val_row['movie_id']\n",
    "            val_rating = val_row['rating']\n",
    "\n",
    "            # Convert data to tensors\n",
    "            val_user_seq = torch.LongTensor([val_user_id])\n",
    "            val_item_seq = torch.LongTensor([val_item_id])\n",
    "            #val_item_seq_len = torch.LongTensor([1])  # Assuming it's just the current item\n",
    "\n",
    "            # Forward pass\n",
    "            val_predicted_rating = model(val_user_seq, val_item_seq)\n",
    "\n",
    "            # Compute validation loss\n",
    "            val_loss = criterion(val_predicted_rating, torch.FloatTensor([val_rating]))\n",
    "            val_losses.append(val_loss.item())\n",
    "\n",
    "    # Log train and validation loss\n",
    "    print(f'Epoch {epoch + 1}/{num_epochs} - '\n",
    "          f'Train Loss: {sum(train_losses) / len(train_losses):.4f}, '\n",
    "          f'Validation Loss: {sum(val_losses) / len(val_losses):.4f}')\n",
    "\n",
    "\n",
    "# Remember to save your model after training\n",
    "torch.save(model.state_dict(), 'your_model.pth')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(len(train_df))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import numpy as np\n",
    "from torch.autograd import Variable\n",
    "\n",
    "class RRN(nn.Module):\n",
    "    def __init__(self):\n",
    "        super(RRN, self).__init__()\n",
    "\n",
    "        # Hyperparameters\n",
    "        self.batch_size = 500\n",
    "        self.n_step = 1\n",
    "        self.lr = 0.001\n",
    "        self.verbose = 100\n",
    "\n",
    "        # Data\n",
    "        dataSet = Data(\"ml-1m\")  # Assuming Data class is implemented\n",
    "        a, b = dataSet.data\n",
    "        self.train = a.values\n",
    "        #print(self.train.shape)\n",
    "        # print(len(np.unique(self.train[:, 1])))\n",
    "        self.valid = b.values\n",
    "\n",
    "        # Model\n",
    "        self.add_embedding_layer()\n",
    "\n",
    "        # Loss and Optimizer\n",
    "        self.criterion = nn.MSELoss()\n",
    "        self.optimizer = optim.Adam(self.parameters(), lr=self.lr)\n",
    "\n",
    "    def save_model(self):\n",
    "        # Save the model\n",
    "        torch.save(self.state_dict(), \"rrn_model_1.pth\")\n",
    "        print(\"Model saved\")\n",
    "\n",
    "    def add_embedding_layer(self):\n",
    "        self.user_embedding = nn.Embedding(6040, 128)\n",
    "        self.movie_embedding = nn.Embedding(3952, 128)\n",
    "        self.user_rnn = nn.GRU(128, 128, batch_first=True)\n",
    "        self.movie_rnn = nn.GRU(128, 128, batch_first=True)\n",
    "        self.user_output_layer = nn.Linear(128, 64)\n",
    "        self.movie_output_layer = nn.Linear(128, 64)\n",
    "\n",
    "    def forward(self, userID, movieID):\n",
    "        uid_embedding = self.user_embedding(userID)\n",
    "        mid_embedding = self.movie_embedding(movieID)\n",
    "\n",
    "        user_rnn_output, _ = self.user_rnn(mid_embedding)\n",
    "        movie_rnn_output, _ = self.movie_rnn(uid_embedding)\n",
    "\n",
    "        #user_output = self.user_output_layer(user_rnn_output[:, -1, :])\n",
    "        user_output = self.user_output_layer(user_rnn_output)\n",
    "        movie_output = self.movie_output_layer(movie_rnn_output)\n",
    "\n",
    "        pred = torch.sum(user_output * movie_output, dim=1, keepdim=True)\n",
    "\n",
    "        return pred\n",
    "\n",
    "    def run(self):\n",
    "        length = len(self.train)\n",
    "        batches = length // self.batch_size + 1\n",
    "\n",
    "        train_loss = []\n",
    "        valid_loss = []\n",
    "\n",
    "        for i in range(batches):\n",
    "            minIdx = i * self.batch_size\n",
    "            maxIdx = min(length, (i + 1) * self.batch_size)\n",
    "            train_batch = self.train[minIdx:maxIdx]\n",
    "            feed_dict_train = self.create_feed_dict(train_batch)\n",
    "\n",
    "            outputs = self.forward(feed_dict_train['userID'], feed_dict_train['movieID'])\n",
    "            # print(outputs.shape)\n",
    "            # print(outputs)\n",
    "            # print(feed_dict_train['rating'].shape)\n",
    "            # print(feed_dict_train['rating'].view(-1,1))\n",
    "            loss = self.criterion(outputs, feed_dict_train['rating'].view(-1,1))\n",
    "            train_loss.append(loss.item())\n",
    "\n",
    "            self.optimizer.zero_grad()\n",
    "            loss.backward()\n",
    "            self.optimizer.step()\n",
    "\n",
    "            if i % self.verbose == 0:\n",
    "                print('\\rTraining: Batch {}/{} - Loss: {:.4f}'.format(\n",
    "                    i, batches, np.sqrt(np.mean(train_loss[-20:]))\n",
    "                ), end='')\n",
    "\n",
    "            # Check validation loss every verbose steps\n",
    "            if i % self.verbose == 0 and i != 0:\n",
    "                feed_dict_valid = self.create_feed_dict(self.valid)\n",
    "                outputs_valid = self.forward(feed_dict_valid['userID'], feed_dict_valid['movieID'])\n",
    "                valid_loss_epoch = self.criterion(outputs_valid, feed_dict_valid['rating'].view(-1,1)).item()\n",
    "                valid_loss.append(np.sqrt(valid_loss_epoch))\n",
    "                print(' - Validation Loss: {:.4f}'.format(valid_loss[-1]), end='')\n",
    "\n",
    "        print(\"\\nTraining Finish, Last 2000 batches loss is {}.\".format(\n",
    "            np.sqrt(np.mean(train_loss[-2000:]))\n",
    "        ))\n",
    "        feed_dict_valid = self.create_feed_dict(self.valid)\n",
    "        outputs_valid = self.forward(feed_dict_valid['userID'], feed_dict_valid['movieID'])\n",
    "        valid_loss_epoch = self.criterion(outputs_valid, feed_dict_valid['rating'].view(-1,1)).item()\n",
    "        print(\"Validation Loss: {:.4f}\".format(np.sqrt(valid_loss_epoch)))\n",
    "        self.save_model()\n",
    "\n",
    "    def create_feed_dict(self, data):\n",
    "        userID = torch.LongTensor([i[0] - 1 for i in data])\n",
    "        movieID = torch.LongTensor([i[1] - 1 for i in data])\n",
    "        ratings = torch.FloatTensor([float(i[2]) for i in data])\n",
    "        return {\n",
    "            'userID': userID,\n",
    "            'movieID': movieID,\n",
    "            'rating': ratings,\n",
    "        }\n",
    "\n",
    "\n",
    "# if __name__ == '__main__':\n",
    "#     model = RRN()\n",
    "#     model.run()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "model = torch.load('rrn_model_1.pth')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_user_vector(model, user_history):\n",
    "    user_history = torch.LongTensor(user_history).unsqueeze(0)  # Add batch dimension\n",
    "    user_embeddings = model.movie_embedding(user_history)\n",
    "    _, user_hidden = model.user_rnn(user_embeddings)\n",
    "    user_vector = model.user_output_layer(user_hidden.squeeze(0))\n",
    "    return user_vector"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = RRN()\n",
    "model.load_state_dict(torch.load('rrn_model_1.pth'))\n",
    "# model.eval()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Assume the model is trained and stored in the 'model' variable\n",
    "user_history = [1, 5, 10, 20]  # Example user history (list of movie IDs)\n",
    "user_vector = get_user_vector(model,user_history)\n",
    "print(user_vector)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "RecBole"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "class AbstractRecommender(nn.Module):\n",
    "    r\"\"\"Base class for all models\"\"\"\n",
    "\n",
    "    def __init__(self):\n",
    "        self.logger = getLogger()\n",
    "        super(AbstractRecommender, self).__init__()\n",
    "\n",
    "    def calculate_loss(self, interaction):\n",
    "        r\"\"\"Calculate the training loss for a batch data.\n",
    "\n",
    "        Args:\n",
    "            interaction (Interaction): Interaction class of the batch.\n",
    "\n",
    "        Returns:\n",
    "            torch.Tensor: Training loss, shape: []\n",
    "        \"\"\"\n",
    "        raise NotImplementedError\n",
    "\n",
    "    def predict(self, interaction):\n",
    "        r\"\"\"Predict the scores between users and items.\n",
    "\n",
    "        Args:\n",
    "            interaction (Interaction): Interaction class of the batch.\n",
    "\n",
    "        Returns:\n",
    "            torch.Tensor: Predicted scores for given users and items, shape: [batch_size]\n",
    "        \"\"\"\n",
    "        raise NotImplementedError\n",
    "\n",
    "    def full_sort_predict(self, interaction):\n",
    "        r\"\"\"full sort prediction function.\n",
    "        Given users, calculate the scores between users and all candidate items.\n",
    "\n",
    "        Args:\n",
    "            interaction (Interaction): Interaction class of the batch.\n",
    "\n",
    "        Returns:\n",
    "            torch.Tensor: Predicted scores for given users and all candidate items,\n",
    "            shape: [n_batch_users * n_candidate_items]\n",
    "        \"\"\"\n",
    "        raise NotImplementedError\n",
    "\n",
    "    def other_parameter(self):\n",
    "        if hasattr(self, \"other_parameter_name\"):\n",
    "            return {key: getattr(self, key) for key in self.other_parameter_name}\n",
    "        return dict()\n",
    "\n",
    "    def load_other_parameter(self, para):\n",
    "        if para is None:\n",
    "            return\n",
    "        for key, value in para.items():\n",
    "            setattr(self, key, value)\n",
    "\n",
    "    def __str__(self):\n",
    "        \"\"\"\n",
    "        Model prints with number of trainable parameters\n",
    "        \"\"\"\n",
    "        model_parameters = filter(lambda p: p.requires_grad, self.parameters())\n",
    "        params = sum([np.prod(p.size()) for p in model_parameters])\n",
    "        return (\n",
    "            super().__str__()\n",
    "            + set_color(\"\\nTrainable parameters\", \"blue\")\n",
    "            + f\": {params}\"\n",
    "        )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "class SequentialRecommender(AbstractRecommender):\n",
    "    \"\"\"\n",
    "    This is a abstract sequential recommender. All the sequential model should implement This class.\n",
    "    \"\"\"\n",
    "\n",
    "    #type = ModelType.SEQUENTIAL\n",
    "\n",
    "    def __init__(self, config, dataset):\n",
    "        super(SequentialRecommender, self).__init__()\n",
    "\n",
    "        # load dataset info\n",
    "        self.USER_ID = config[\"USER_ID_FIELD\"]\n",
    "        self.ITEM_ID = config[\"ITEM_ID_FIELD\"]\n",
    "        self.ITEM_SEQ = self.ITEM_ID + config[\"LIST_SUFFIX\"]\n",
    "        self.ITEM_SEQ_LEN = config[\"ITEM_LIST_LENGTH_FIELD\"]\n",
    "        self.POS_ITEM_ID = self.ITEM_ID\n",
    "        self.NEG_ITEM_ID = config[\"NEG_PREFIX\"] + self.ITEM_ID\n",
    "        self.max_seq_length = config[\"MAX_ITEM_LIST_LENGTH\"]\n",
    "        self.n_items = dataset.num(self.ITEM_ID)\n",
    "\n",
    "        # load parameters info\n",
    "        self.device = config[\"device\"]\n",
    "\n",
    "    def gather_indexes(self, output, gather_index):\n",
    "        \"\"\"Gathers the vectors at the specific positions over a minibatch\"\"\"\n",
    "        gather_index = gather_index.view(-1, 1, 1).expand(-1, -1, output.shape[-1])\n",
    "        output_tensor = output.gather(dim=1, index=gather_index)\n",
    "        return output_tensor.squeeze(1)\n",
    "\n",
    "    def get_attention_mask(self, item_seq, bidirectional=False):\n",
    "        \"\"\"Generate left-to-right uni-directional or bidirectional attention mask for multi-head attention.\"\"\"\n",
    "        attention_mask = item_seq != 0\n",
    "        extended_attention_mask = attention_mask.unsqueeze(1).unsqueeze(2)  # torch.bool\n",
    "        if not bidirectional:\n",
    "            extended_attention_mask = torch.tril(\n",
    "                extended_attention_mask.expand((-1, -1, item_seq.size(-1), -1))\n",
    "            )\n",
    "        extended_attention_mask = torch.where(extended_attention_mask, 0.0, -10000.0)\n",
    "        return extended_attention_mask\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from torch import nn\n",
    "from torch.nn.init import xavier_uniform_, xavier_normal_\n",
    "\n",
    "#from recbole.model.abstract_recommender import SequentialRecommender\n",
    "from recbole.model.loss import BPRLoss\n",
    "\n",
    "\n",
    "class GRU4Rec(SequentialRecommender):\n",
    "    r\"\"\"GRU4Rec is a model that incorporate RNN for recommendation.\n",
    "\n",
    "    Note:\n",
    "\n",
    "        Regarding the innovation of this article,we can only achieve the data augmentation mentioned\n",
    "        in the paper and directly output the embedding of the item,\n",
    "        in order that the generation method we used is common to other sequential models.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, config, dataset):\n",
    "        super(GRU4Rec, self).__init__(config, dataset)\n",
    "\n",
    "        # load parameters info\n",
    "        self.embedding_size = config[\"embedding_size\"]\n",
    "        self.hidden_size = config[\"hidden_size\"]\n",
    "        self.loss_type = config[\"loss_type\"]\n",
    "        self.num_layers = config[\"num_layers\"]\n",
    "        self.dropout_prob = config[\"dropout_prob\"]\n",
    "\n",
    "        # define layers and loss\n",
    "        self.item_embedding = nn.Embedding(\n",
    "            self.n_items, self.embedding_size, padding_idx=0\n",
    "        )\n",
    "        self.emb_dropout = nn.Dropout(self.dropout_prob)\n",
    "        self.gru_layers = nn.GRU(\n",
    "            input_size=self.embedding_size,\n",
    "            hidden_size=self.hidden_size,\n",
    "            num_layers=self.num_layers,\n",
    "            bias=False,\n",
    "            batch_first=True,\n",
    "        )\n",
    "        self.dense = nn.Linear(self.hidden_size, self.embedding_size)\n",
    "        # if self.loss_type == \"BPR\":\n",
    "        #     self.loss_fct = BPRLoss()\n",
    "        if self.loss_type == \"CE\":\n",
    "            self.loss_fct = nn.CrossEntropyLoss()\n",
    "        else:\n",
    "            raise NotImplementedError(\"Make sure 'loss_type' in ['BPR', 'CE']!\")\n",
    "\n",
    "        # parameters initialization\n",
    "        self.apply(self._init_weights)\n",
    "\n",
    "    def _init_weights(self, module):\n",
    "        if isinstance(module, nn.Embedding):\n",
    "            xavier_normal_(module.weight)\n",
    "        elif isinstance(module, nn.GRU):\n",
    "            xavier_uniform_(module.weight_hh_l0)\n",
    "            xavier_uniform_(module.weight_ih_l0)\n",
    "\n",
    "    def forward(self, item_seq, item_seq_len):\n",
    "        item_seq_emb = self.item_embedding(item_seq)\n",
    "        item_seq_emb_dropout = self.emb_dropout(item_seq_emb)\n",
    "        gru_output, _ = self.gru_layers(item_seq_emb_dropout)\n",
    "        gru_output = self.dense(gru_output)\n",
    "        # the embedding of the predicted item, shape of (batch_size, embedding_size)\n",
    "        seq_output = self.gather_indexes(gru_output, item_seq_len - 1)\n",
    "        return seq_output\n",
    "\n",
    "    def calculate_loss(self, interaction):\n",
    "        item_seq = interaction[self.ITEM_SEQ]\n",
    "        item_seq_len = interaction[self.ITEM_SEQ_LEN]\n",
    "        seq_output = self.forward(item_seq, item_seq_len)\n",
    "        pos_items = interaction[self.POS_ITEM_ID]\n",
    "        # if self.loss_type == \"BPR\":\n",
    "        #     neg_items = interaction[self.NEG_ITEM_ID]\n",
    "        #     pos_items_emb = self.item_embedding(pos_items)\n",
    "        #     neg_items_emb = self.item_embedding(neg_items)\n",
    "        #     pos_score = torch.sum(seq_output * pos_items_emb, dim=-1)  # [B]\n",
    "        #     neg_score = torch.sum(seq_output * neg_items_emb, dim=-1)  # [B]\n",
    "        #     loss = self.loss_fct(pos_score, neg_score)\n",
    "        #     return loss\n",
    "        #else:  # self.loss_type = 'CE'\n",
    "        test_item_emb = self.item_embedding.weight\n",
    "        logits = torch.matmul(seq_output, test_item_emb.transpose(0, 1))\n",
    "        loss = self.loss_fct(logits, pos_items)\n",
    "        return loss\n",
    "\n",
    "    def predict(self, interaction):\n",
    "        item_seq = interaction[self.ITEM_SEQ]\n",
    "        item_seq_len = interaction[self.ITEM_SEQ_LEN]\n",
    "        test_item = interaction[self.ITEM_ID]\n",
    "        seq_output = self.forward(item_seq, item_seq_len)\n",
    "        test_item_emb = self.item_embedding(test_item)\n",
    "        scores = torch.mul(seq_output, test_item_emb).sum(dim=1)  # [B]\n",
    "        return scores\n",
    "\n",
    "    def full_sort_predict(self, interaction):\n",
    "        item_seq = interaction[self.ITEM_SEQ]\n",
    "        item_seq_len = interaction[self.ITEM_SEQ_LEN]\n",
    "        seq_output = self.forward(item_seq, item_seq_len)\n",
    "        test_items_emb = self.item_embedding.weight\n",
    "        scores = torch.matmul(\n",
    "            seq_output, test_items_emb.transpose(0, 1)\n",
    "        )  # [B, n_items]\n",
    "        return scores"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "ChatGPT"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import openai\n",
    "\n",
    "# Set your OpenAI GPT-3 API key\n",
    "openai.api_key = 'your-api-key'\n",
    "\n",
    "def simulate_user_interaction(user_profile, recommended_list, user_history=[]):\n",
    "    # Get recommendations from ChatGPT\n",
    "    response = openai.Completion.create(\n",
    "        engine=\"text-davinci-003\",\n",
    "        prompt=f\"User Profile: {user_profile}\\nRecommended List: {recommended_list}\\nChoose an item and provide a rating:\",\n",
    "        temperature=0.7,\n",
    "        max_tokens=100\n",
    "    )\n",
    "\n",
    "    # Extract user's choice and rating from the response\n",
    "    user_choice = \"Chosen Movie\"  # Extract from the response\n",
    "    user_rating = 5.0  # Extract from the response\n",
    "\n",
    "    # Check if the user's choice is from the recommended list\n",
    "    if user_choice in recommended_list:\n",
    "        # Add the chosen movie and rating to the user's history\n",
    "        user_history.append((user_choice, user_rating))\n",
    "    else:\n",
    "        print(\"User's choice is not in the recommended list.\")\n",
    "\n",
    "    # Provide user choice and rating for further interaction\n",
    "    next_input = f\"User Choice: {user_choice}\\nUser Rating: {user_rating}\\nRecommended List: {recommended_list}\\nWhat do you recommend next?\"\n",
    "\n",
    "    # Continue the conversation\n",
    "    response = openai.Completion.create(\n",
    "        engine=\"text-davinci-003\",\n",
    "        prompt=next_input,\n",
    "        temperature=0.7,\n",
    "        max_tokens=100\n",
    "    )\n",
    "\n",
    "    return user_history\n",
    "\n",
    "# Example usage\n",
    "user_profile = \"Likes romcoms, rates highly.\"\n",
    "recommended_list = [\"Movie A\", \"Movie B\", \"Movie C\"]\n",
    "\n",
    "# Simulate user interactions\n",
    "user_history = simulate_user_interaction(user_profile, recommended_list)\n",
    "print(\"User History:\", user_history)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "from openai import OpenAI\n",
    "client = OpenAI(api_key=\"\")\n",
    "\n",
    "prompt = \"Please read the following multiple-choice question carefully and select ONE of the listed option's letters ONLY. How much, if at all, do you worry about the following happening to you? Being the victim of a terrorist attack \\\n",
    "    A. Worry a lot \\\n",
    "    B. Worry a little \\\n",
    "    C. Do not worry at all \\\n",
    "    D. Refused to anser\"\n",
    "gpt_35_turbo_responses=[]\n",
    "\n",
    "try:\n",
    "    completion = client.chat.completions.create(\n",
    "        model=\"gpt-3.5-turbo\",\n",
    "        messages=[\n",
    "            {\n",
    "                \"role\": \"assistant\",\n",
    "                \"content\": prompt\n",
    "            },\n",
    "        ],\n",
    "        temperature=0,\n",
    "        logprobs=True,\n",
    "        top_logprobs=5,\n",
    "        seed=42,\n",
    "        # max_tokens\n",
    "    )\n",
    "    response = json.loads(completion.model_dump_json(indent=2))\n",
    "    gpt_35_turbo_responses.append(response)\n",
    "    print(gpt_35_turbo_responses)\n",
    "\n",
    "except Exception as e:\n",
    "    # Handle the exception here, such as printing an error message\n",
    "    print(f\"Error occurred for prompt: {prompt}\")\n",
    "    print(f\"Error details: {e}\")\n",
    "    gpt_35_turbo_responses.append({\"error\": str(e)})\n",
    "    "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Reachability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#5 is the user we are looking at\n",
    "chosen_item = trainset.ur[5][-1][0]\n",
    "chosen_rating = trainset.ur[5][-1][1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(trainset.ur[4])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_item"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "already_rated = list(user_item_rating_dict[5].keys())\n",
    "ratings = user_item_rating_dict[5]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from tqdm import tqdm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor_single(user_vector, items, ratings):\n",
    "    Q_list = [model_last_item.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor(user_vector, items, ratings):\n",
    "    Q_list = [model.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor_five(user_vector, items, ratings):\n",
    "    Q_list = [model_last_five.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(model.qi)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in ratings:\n",
    "    ratings[i]=torch.tensor(ratings[i], dtype=torch.float64)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "rating_tensor = torch.tensor(list(ratings.values()))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_dict = ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendations(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendation_scores(user_vector, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "    count_var = 0\n",
    "    top_10_item_names=[]\n",
    "    top_10_item_scores=torch.tensor([1, 2, 3, 4, 5, 6, 7, 8, 9, 10], dtype=torch.float64)\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        item_score = i[1]\n",
    "        if item_id not in already_rated:\n",
    "            top_10_item_scores[count_var]=item_score\n",
    "            count_var+=1\n",
    "            top_10_item_names.append(item_id)\n",
    "            # top_10_item_scores.append(item_score)\n",
    "        if count_var==10:\n",
    "            break\n",
    "    return top_10_item_names, top_10_item_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def list_difference_metric(list1, list2):\n",
    "    # Dictionary to store indices of elements in list2\n",
    "    indices_dict = {num: [] for num in list2}\n",
    "\n",
    "    # Populate indices_dict with indices of elements in list2\n",
    "    for idx, num in enumerate(list2):\n",
    "        indices_dict[num].append(idx)\n",
    "\n",
    "    # Calculate absolute difference of indices for each element in list1\n",
    "    abs_diff_sum = 0\n",
    "    for idx, num in enumerate(list1):\n",
    "        if num in indices_dict:\n",
    "            # Calculate absolute difference between index of num in list1 and mean index of num in list2\n",
    "            abs_diff_sum += abs(idx - sum(indices_dict[num]) / len(indices_dict[num]))\n",
    "\n",
    "    # Calculate the average absolute difference\n",
    "    if len(list1) > 0:\n",
    "        average_abs_diff = abs_diff_sum / len(list1)\n",
    "    else:\n",
    "        average_abs_diff = 0  # Handle case where list1 is empty\n",
    "\n",
    "    return average_abs_diff\n",
    "\n",
    "# Example usage\n",
    "list1 = [1, 2, 3, 4, 5]\n",
    "list2 = [5, 4, 2, 3, 1]\n",
    "difference_metric = list_difference_metric(list1, list2)\n",
    "print(\"Difference Metric:\", difference_metric)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!export https_proxy=http://proxy.cmu.edu:3128/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!export http_proxy=http://proxy.cmu.edu:3128/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#we will have 3 loops: 1 over epochs; another one over calculating objective; the last one is looping over the 5 steps"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch.nn.functional as F\n",
    "def get_recommendations_stochastic(user_vector, already_rated, sample_size):\n",
    "    beta = 0.8\n",
    "    num_samples = sample_size\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "        predicted_ratings[item] = item_rating\n",
    "    #sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    available_items = {item: rating for item, rating in predicted_ratings.items() if item not in already_rated}\n",
    "    \n",
    "    # Convert the predicted ratings dictionary to PyTorch tensor\n",
    "    ratings_tensor_1 = torch.tensor(list(available_items.values()), dtype=torch.float)\n",
    "    \n",
    "    # Compute probabilities proportional to exp(beta*predicted_rating)\n",
    "    probabilities = F.softmax(beta * ratings_tensor_1, dim=0)\n",
    "    \n",
    "    # Sample num_samples items based on the probability distribution\n",
    "    sampled_indices = torch.multinomial(probabilities, num_samples, replacement=False)\n",
    "    \n",
    "    # Convert indices to item names and corresponding predicted scores\n",
    "    sampled_items = [list(available_items.keys())[idx] for idx in sampled_indices]\n",
    "    # sampled_scores = [list(available_items.values())[idx] for idx in sampled_indices]\n",
    "    \n",
    "    return sampled_items#, sampled_scores\n",
    "        \n",
    "    # count_var = 0\n",
    "    # top_10_item_names=[]\n",
    "    # for i in sorted_pred_ratings:\n",
    "    #     item_id = i[0]\n",
    "    #     if item_id not in already_rated:\n",
    "    #         count_var+=1\n",
    "    #         top_10_item_names.append(item_id)\n",
    "    #     if count_var==10:\n",
    "    #         break\n",
    "    # return top_10_item_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_recommendation_scores_stochastic(user_vector, already_rated, sample_size, type_):\n",
    "    beta = 0.8\n",
    "    num_samples = sample_size\n",
    "    if type_ == 'keepall':\n",
    "        n_items =len(model.qi)\n",
    "    if type_ == 'single':\n",
    "        n_items =len(model_last_item.qi)\n",
    "    if type_ == 'five':\n",
    "        n_items =len(model_last_five.qi)\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    if type_ == 'keepall':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "            predicted_ratings[item] = item_rating\n",
    "    if type_ == 'single':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_item.qi[item])\n",
    "            predicted_ratings[item] = item_rating    \n",
    "    if type_ == 'five':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_five.qi[item])\n",
    "            predicted_ratings[item] = item_rating       \n",
    "    #sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    available_items = {item: rating for item, rating in predicted_ratings.items() if item not in already_rated}\n",
    "    \n",
    "    # Convert the predicted ratings dictionary to PyTorch tensor\n",
    "    ratings_tensor_1 = torch.tensor(list(available_items.values()), dtype=torch.float)\n",
    "    \n",
    "    # Compute probabilities proportional to exp(beta*predicted_rating)\n",
    "    probabilities = F.softmax(beta * ratings_tensor_1, dim=0)\n",
    "    \n",
    "    # Sample num_samples items based on the probability distribution\n",
    "    sampled_indices = torch.multinomial(probabilities, num_samples, replacement=False)\n",
    "    \n",
    "    # Convert indices to item names and corresponding predicted scores\n",
    "    sampled_items = [list(available_items.keys())[idx] for idx in sampled_indices]\n",
    "    sampled_scores = [list(available_items.values())[idx] for idx in sampled_indices]\n",
    "    \n",
    "    return sampled_items, sampled_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Stochastic choice\n",
    "# import wandb\n",
    "\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "sample_size=10\n",
    "user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 295\n",
    "min_score = float('inf')\n",
    "for epoch in tqdm(range(1, 50)):\n",
    "    item_rating = 0 \n",
    "    rating_vals = torch.zeros(20)\n",
    "    for int_var in range(0,20):\n",
    "        user_action_clamped = user_action.clamp(1, 5) \n",
    "        rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "        user_vector_initial = torch.from_numpy(model_last_item.pu[5])\n",
    "        user_vector = user_vector_initial\n",
    "        time_max = 5\n",
    "        already_rated = list(user_item_rating_dict[5].keys())\n",
    "        #already_rated = already_rated[:-1]\n",
    "        ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "        # del ratings[chosen_item]\n",
    "        ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "        # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "        n = len(ratings_old)\n",
    "        zeros_to_add = torch.zeros(time_max)\n",
    "        ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        #already_rated.append(chosen_item)\n",
    "        user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n])\n",
    "        for timestep in range(1, time_max+1):\n",
    "            recommendations, recommendation_scores = get_recommendation_scores_stochastic(user_vector, already_rated, sample_size, 'single')\n",
    "            usr_type = UserType(\"Choice Enjoyer\", torch.tensor(recommendation_scores), [], beta=0.8)\n",
    "            choice_of_item = recommendations[usr_type.item_choice]\n",
    "            ratings[n+timestep-1] = torch.tensor(usr_type.item_rating)\n",
    "            already_rated.append(choice_of_item)\n",
    "            user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n+timestep])\n",
    "        item_rating = torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item_to_be_reached]))\n",
    "        rating_vals[int_var] = item_rating\n",
    "    fin_rating = -torch.exp(0.8*torch.sum(rating_vals)/len(rating_vals))\n",
    "    print(abs(fin_rating))\n",
    "    fin_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "total_sum=0\n",
    "for item in range(len(model_last_item.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item])))\n",
    "print(-fin_rating/total_sum)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Repeated top cell for my version case below:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "###########REPEATED##############(it's the og using my original idea, not reachability paper)#\n",
    "\n",
    "\n",
    "#Stochastic choice\n",
    "# import wandb\n",
    "\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 15\n",
    "min_score = float('inf')\n",
    "for epoch in tqdm(range(1, 50)):\n",
    "    item_rating = 0 \n",
    "    rating_vals = torch.zeros(20)\n",
    "    for int_var in range(0,20):\n",
    "        user_action_clamped = user_action.clamp(1, 5) \n",
    "        rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "        user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "        user_vector = user_vector_initial\n",
    "        time_max = 5\n",
    "        already_rated = list(user_item_rating_dict[5].keys())\n",
    "        #already_rated = already_rated[:-1]\n",
    "        ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "        # del ratings[chosen_item]\n",
    "        ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "        # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "        n = len(ratings_old)\n",
    "        zeros_to_add = torch.zeros(time_max)\n",
    "        ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        #already_rated.append(chosen_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n])\n",
    "        for timestep in range(1, time_max+1):\n",
    "            recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "            #print(recommendation_scores)\n",
    "            min_score = min(recommendation_scores)\n",
    "            usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "            choice_of_item = recommendations[usr_type.item_choice]\n",
    "            ratings[n+timestep-1] = torch.tensor(usr_type.item_rating)\n",
    "            already_rated.append(choice_of_item)\n",
    "            user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep])\n",
    "        item_rating = -torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached]))\n",
    "        rating_vals[int_var] = item_rating\n",
    "    fin_rating = torch.sum(rating_vals)/len(rating_vals)\n",
    "    print(abs(fin_rating))\n",
    "    if abs(fin_rating)>min_score:\n",
    "        print(\"Item Reached\")\n",
    "        break\n",
    "    fin_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()\n",
    "    #user_action = user_action.clamp(1, 5) \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_action"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from torchviz import make_dot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Deterministic choice\n",
    "# import wandb\n",
    "\n",
    "# wandb.init(project=\"reachability-single-deterministic\", name=\"run_1_lr_0.08\")\n",
    "sample_size=1\n",
    "user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 9\n",
    "min_score = float('inf')\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5) \n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    #already_rated = already_rated[:-1]\n",
    "    ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "    # del ratings[chosen_item]\n",
    "    ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "    # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    #already_rated.append(chosen_item)\n",
    "    user_vector = update_user_tensor(user_vector, already_rated, ratings[:n])\n",
    "    for timestep in range(1, time_max+1):\n",
    "        recommendations, recommendation_scores = get_recommendation_scores_stochastic(user_vector, already_rated, sample_size)\n",
    "        # usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "        choice_of_item = recommendations[0]\n",
    "        ratings[n+timestep-1] = 5\n",
    "        already_rated.append(choice_of_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep])\n",
    "    item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached])))\n",
    "    print(abs(item_rating))\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Repeated below this"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "###########REPEATED##############(it's the og using my original idea, not reachability paper)#\n",
    "\n",
    "#Deterministic choice\n",
    "# import wandb\n",
    "\n",
    "# wandb.init(project=\"reachability-single-deterministic\", name=\"run_1_lr_0.08\")\n",
    "user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 8\n",
    "min_score = float('inf')\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5) \n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    #already_rated = already_rated[:-1]\n",
    "    ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "    # del ratings[chosen_item]\n",
    "    ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "    # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    #print(ratings)\n",
    "    #already_rated.append(chosen_item)\n",
    "    user_vector = update_user_tensor(user_vector, already_rated, ratings[:n])\n",
    "    for timestep in range(1, time_max+1):\n",
    "        recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "        #print(recommendation_scores)\n",
    "        min_score = min(recommendation_scores)\n",
    "        # usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "        choice_of_item = recommendations[0]\n",
    "        ratings[n+timestep-1] = 5\n",
    "        already_rated.append(choice_of_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep])\n",
    "    item_rating = -torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached]))\n",
    "    print(abs(item_rating))\n",
    "    if abs(item_rating)>min_score:\n",
    "        print(\"Item Reached\")\n",
    "        break\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# #Okay lets change this item\n",
    "# #Deterministic choice\n",
    "# user_action = torch.tensor(chosen_rating, requires_grad=True)\n",
    "# optimizer = torch.optim.Adam([user_action], lr=0.01)\n",
    "# item_to_be_reached = 8\n",
    "# target_item_embedding = torch.from_numpy(model.qi[item_to_be_reached])\n",
    "# for epoch in range(1, 50):\n",
    "#     # user_action_clamped = user_action.clamp(1, 5) \n",
    "#     user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "#     user_vector = user_vector_initial\n",
    "#     time_max = 5\n",
    "#     already_rated = list(user_item_rating_dict[5].keys())\n",
    "#     #print(already_rated)\n",
    "#     #already_rated = already_rated[:-1]\n",
    "#     ratings = user_item_rating_dict[5]\n",
    "#     # del ratings[chosen_item]\n",
    "#     ratings[chosen_item] = user_action.item()\n",
    "#     #print(ratings)\n",
    "#     #already_rated.append(chosen_item)\n",
    "#     user_vector = torch.from_numpy(update_user_vector(user_vector, already_rated, np.array(list(ratings.values()))))\n",
    "#     for timestep in tqdm(range(1, time_max+1)):\n",
    "#         recommendations = get_recommendations(user_vector, already_rated)\n",
    "#         choice_of_item = recommendations[0]\n",
    "#         ratings[choice_of_item] = 5\n",
    "#         already_rated.append(choice_of_item)\n",
    "#         user_vector = torch.from_numpy(update_user_vector(user_vector, already_rated, np.array(list(ratings.values()))))\n",
    "#     item_rating = -torch.matmul(user_vector, target_item_embedding)\n",
    "#     print(item_rating)\n",
    "#     item_rating.requires_grad_()\n",
    "#     item_rating.backward()\n",
    "#     #user_action.retain_grad()\n",
    "#     optimizer.step()\n",
    "#     # print(user_action.grad)\n",
    "#     # print(user_action)\n",
    "#     #print(item_rating.grad)\n",
    "#     optimizer.zero_grad()\n",
    "#     #user_action = torch.clamp(user_action, min=1, max=5)\n",
    "#     #user_action = user_action.clamp(1, 5) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "t1_set = trainset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset.to_raw_uid(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "t1_set.to_raw_iid(9)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "t1_set.all_ratings()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "t1_set"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#5 is the user we are looking at\n",
    "item_and_rating =  trainset.ur[5][-5:]\n",
    "chosen_items = [i[0] for i in item_and_rating]\n",
    "chosen_ratings = [i[1] for i in item_and_rating]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items_raw = [i+1 for i in chosen_items]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items_raw"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "filtered_ratings_df = ratings_df[~((ratings_df['user_int'] == 6) & (ratings_df['movie_id'].isin(chosen_items_raw)))]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "filtered_ratings_df[filtered_ratings_df['user_int']==6]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(filtered_ratings_df[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "model_last_5 = SVD(biased=False)\n",
    "\n",
    "# Perform cross-validation\n",
    "cv_results = cross_validate(model, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# Print the cross-validation results\n",
    "for measure in ['test_rmse', 'test_mae']:\n",
    "    print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset2 = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "model_last_5.fit(trainset2)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_action = torch.tensor(chosen_ratings)\n",
    "print(user_action)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!export https_proxy=http://proxy.cmu.edu:3128/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-history\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 8\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model_last_five.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    already_rated = already_rated[:-5]\n",
    "    ratings_old = rating_tensor[:-5]\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    # del ratings[chosen_item]\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        curr_item = chosen_items[timestep]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor_five(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_five.qi[item_to_be_reached])))\n",
    "    print(abs(item_rating))\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "ok below this is repeated (I mean the OG)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "##########REPEATED with my original take#############\n",
    "\n",
    "\n",
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-history\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 8\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    already_rated = already_rated[:-5]\n",
    "    ratings_old = rating_tensor[:-5]\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        curr_item = chosen_items[timestep]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    item_rating = -torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached]))\n",
    "    print(abs(item_rating))\n",
    "    recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "    if min(recommendation_scores)<item_rating:\n",
    "        print(\"Item Reached\")\n",
    "        break\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.matmul(torch.from_numpy(model.pu[5]), torch.from_numpy(model.qi[item_to_be_reached]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#looking at the future\n",
    "#I should be able to choose best possible item too\n",
    "#greedy?\n",
    "#how can this optimization be consistent across epochs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-future\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 8\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    ratings_old = rating_tensor\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "        curr_item = recommendations[0]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    item_rating = -torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached]))\n",
    "    print(abs(item_rating))\n",
    "    recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "    if min(recommendation_scores)<item_rating:\n",
    "        print(\"Item Reached\")\n",
    "        break\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Real thing below"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#########REPEATED##########\n",
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-future\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 8\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 5\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    already_rated = already_rated[:-5]\n",
    "    #print(already_rated)\n",
    "    #already_rated = already_rated[:-1]\n",
    "    ratings_old = rating_tensor[:-5]\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    # del ratings[chosen_item]\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "        curr_item = recommendations[0]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    item_rating = -torch.matmul(user_vector, torch.from_numpy(model.qi[item_to_be_reached]))\n",
    "    print(abs(item_rating))\n",
    "    recommendations, recommendation_scores = get_recommendation_scores(user_vector, already_rated)\n",
    "    if min(recommendation_scores)<item_rating:\n",
    "        print(\"Item Reached\")\n",
    "        break\n",
    "    item_rating.backward()\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#ok time to create influential and non-influential users\n",
    "ratings_count = {}\n",
    "for user_id, ratings1 in trainset.ur.items():\n",
    "    # Count the number of ratings for the user and store it in ratings_count\n",
    "    ratings_count[user_id] = len(ratings1)\n",
    "\n",
    "# Sort the ratings_count dictionary by the number of ratings in descending order\n",
    "sorted_ratings_count = sorted(ratings_count.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "# Get the top 10 influential users based on the number of ratings\n",
    "top_influential_users = [user_id for user_id, _ in sorted_ratings_count[:10]]\n",
    "\n",
    "print(\"Top 10 influential users based on the number of ratings:\")\n",
    "print(top_influential_users)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get the top 10 influential users based on the number of ratings\n",
    "least_influential_users = [user_id for user_id, _ in sorted_ratings_count[-10:]]\n",
    "\n",
    "print(\"Top 10 least influential users based on the number of ratings:\")\n",
    "print(least_influential_users)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mid_users = [i for i, _ in sorted_ratings_count[199:210]]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mid_users"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_ratings_count"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Stochastic choice\n",
    "# import wandb\n",
    "outer_reach_prob =[]\n",
    "for u in tqdm(top_influential_users):\n",
    "    print(\"Hey\")\n",
    "    n_items = len(model_last_item.qi)\n",
    "    all_items = list(range(n_items))\n",
    "    already_rated_outer = list(user_item_rating_dict[u].keys())\n",
    "    # Remove items that are already rated\n",
    "    available_items = [item for item in all_items if item not in already_rated_outer]\n",
    "    # Sample num_samples items at random from available_items\n",
    "    items_to_be_reached = random.sample(available_items, min(7, len(available_items)))\n",
    "    #select a pool of 50 items that the user has not rated\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "    reach_probabilities = []\n",
    "    for i in items_to_be_reached:\n",
    "        print(\"Ho\")\n",
    "        final_rating=0\n",
    "        sample_size=10\n",
    "        chosen_rating = 0\n",
    "        user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "        optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "        item_to_be_reached = i\n",
    "        min_score = float('inf')\n",
    "        ratings_dict1 = user_item_rating_dict[u]\n",
    "        for j in user_item_rating_dict[u]:\n",
    "            ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "        ratings_dict = ratings_dict1\n",
    "        for epoch in range(1, 50):\n",
    "            item_rating = 0 \n",
    "            rating_vals = torch.zeros(20)\n",
    "            for int_var in range(0,20):\n",
    "                user_action_clamped = user_action.clamp(1, 5) \n",
    "                rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "                user_vector_initial = torch.from_numpy(model_last_item.pu[u])\n",
    "                user_vector = user_vector_initial\n",
    "                time_max = 0\n",
    "                already_rated = list(user_item_rating_dict[u].keys())\n",
    "                #print(already_rated)\n",
    "                #already_rated = already_rated[:-1]\n",
    "                ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "                # del ratings[chosen_item]\n",
    "                ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "                # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "                n = len(ratings_old)\n",
    "                zeros_to_add = torch.zeros(time_max)\n",
    "                ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "                #already_rated.append(chosen_item)\n",
    "                user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n])\n",
    "                for timestep in range(1, time_max+1):\n",
    "                    recommendations, recommendation_scores = get_recommendation_scores_stochastic(user_vector, already_rated, sample_size, 'single')\n",
    "                    #print(recommendation_scores)\n",
    "                    #min_score = min(recommendation_scores)\n",
    "                    usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "                    choice_of_item = recommendations[usr_type.item_choice]\n",
    "                    ratings[n+timestep-1] = torch.tensor(usr_type.item_rating)\n",
    "                    already_rated.append(choice_of_item)\n",
    "                    user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n+timestep])\n",
    "                item_rating = torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item_to_be_reached]))\n",
    "                rating_vals[int_var] = item_rating\n",
    "            fin_rating = -torch.exp(0.8*torch.sum(rating_vals)/len(rating_vals))\n",
    "            fin_rating.backward()\n",
    "            optimizer.step()\n",
    "            # print(user_action.grad)\n",
    "            #print(user_action)\n",
    "            optimizer.zero_grad()\n",
    "            #user_action = user_action.clamp(1, 5) \n",
    "        final_rating = -fin_rating.item()\n",
    "        #now get probability\n",
    "        total_sum = 0\n",
    "        for item in range(len(model_last_item.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item])))\n",
    "        reach_probabilities.append(final_rating/total_sum)\n",
    "    outer_reach_prob.append(sum(reach_probabilities))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sum(outer_reach_prob)/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#mean was 0.0033333"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model_last_item.pu[5958]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Stochastic choice\n",
    "# import wandb\n",
    "outer_reach_prob_less =[]\n",
    "for u in mid_users:\n",
    "    print(\"Hey\")\n",
    "    n_items = len(model_last_item.qi)\n",
    "    all_items = list(range(n_items))\n",
    "    already_rated_outer = list(user_item_rating_dict[u].keys())\n",
    "    # Remove items that are already rated\n",
    "    available_items = [item for item in all_items if item not in already_rated_outer]\n",
    "    # Sample num_samples items at random from available_items\n",
    "    items_to_be_reached = random.sample(available_items, min(7, len(available_items)))\n",
    "    #select a pool of 50 items that the user has not rated\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "    reach_probabilities = []\n",
    "    for i in items_to_be_reached:\n",
    "        print(\"Ho\")\n",
    "        final_rating=0\n",
    "        sample_size=10\n",
    "        chosen_rating = 0\n",
    "        user_action = torch.tensor(chosen_rating, requires_grad=True, dtype=torch.float64)\n",
    "        optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "        item_to_be_reached = i\n",
    "        min_score = float('inf')\n",
    "        ratings_dict1 = user_item_rating_dict[u]\n",
    "        for j in user_item_rating_dict[u]:\n",
    "            ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "        ratings_dict = ratings_dict1\n",
    "        for epoch in range(1, 50):\n",
    "            item_rating = 0 \n",
    "            rating_vals = torch.zeros(20)\n",
    "            for int_var in range(0,20):\n",
    "                user_action_clamped = user_action.clamp(1, 5) \n",
    "                rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "                user_vector_initial = torch.from_numpy(model_last_item.pu[u])\n",
    "                user_vector = user_vector_initial\n",
    "                time_max = 0\n",
    "                already_rated = list(user_item_rating_dict[u].keys())\n",
    "                #print(already_rated)\n",
    "                #already_rated = already_rated[:-1]\n",
    "                ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "                # del ratings[chosen_item]\n",
    "                ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "                # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "                n = len(ratings_old)\n",
    "                zeros_to_add = torch.zeros(time_max)\n",
    "                ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "                #print(ratings)\n",
    "                #already_rated.append(chosen_item)\n",
    "                user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n])\n",
    "                for timestep in range(1, time_max+1):\n",
    "                    recommendations, recommendation_scores = get_recommendation_scores_stochastic(user_vector, already_rated, sample_size, 'single')\n",
    "                    #print(recommendation_scores)\n",
    "                    #min_score = min(recommendation_scores)\n",
    "                    usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "                    choice_of_item = recommendations[usr_type.item_choice]\n",
    "                    ratings[n+timestep-1] = torch.tensor(usr_type.item_rating)\n",
    "                    already_rated.append(choice_of_item)\n",
    "                    user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n+timestep])\n",
    "                item_rating = torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item_to_be_reached]))\n",
    "                rating_vals[int_var] = item_rating\n",
    "            fin_rating = -torch.exp(0.8*torch.sum(rating_vals)/len(rating_vals))\n",
    "            print(abs(fin_rating))\n",
    "            fin_rating.backward()\n",
    "            optimizer.step()\n",
    "            # print(user_action.grad)\n",
    "            #print(user_action)\n",
    "            optimizer.zero_grad()\n",
    "            #user_action = user_action.clamp(1, 5) \n",
    "        final_rating = -fin_rating.item()\n",
    "        #now get probability\n",
    "        total_sum = 0\n",
    "        for item in range(len(model_last_item.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item])))\n",
    "        reach_probabilities.append(final_rating/total_sum)\n",
    "    outer_reach_prob_less.append(sum(reach_probabilities))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob_less"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sum_prob=0\n",
    "for i in outer_reach_prob_less:\n",
    "    sum_prob+=i\n",
    "print(sum_prob/10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.matmul(model_last_item.pu[5937],model_last_item.qi[2956])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob_less"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Stochastic choice\n",
    "# import wandb\n",
    "outer_reach_prob1 =[]\n",
    "for u in top_influential_users:\n",
    "    print(\"Hey\")\n",
    "    all_items = list(range(n_items))\n",
    "    already_rated_outer = list(user_item_rating_dict[u].keys())\n",
    "    # Remove items that are already rated\n",
    "    available_items = [item for item in all_items if item not in already_rated_outer]\n",
    "    # Sample num_samples items at random from available_items\n",
    "    items_to_be_reached = random.sample(available_items, min(7, len(available_items)))\n",
    "    #select a pool of 50 items that the user has not rated\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "    item_and_rating =  trainset.ur[u][-5:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[u]\n",
    "    for j in user_item_rating_dict[u]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    for i in tqdm(items_to_be_reached):\n",
    "        print(\"Ho\")\n",
    "        final_rating=0\n",
    "        sample_size=10\n",
    "        user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "        optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "        item_to_be_reached = i\n",
    "        for epoch in range(1, 50):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.from_numpy(model_last_five.pu[u])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = 5\n",
    "            already_rated = list(user_item_rating_dict[u].keys())\n",
    "            already_rated = already_rated[:-5]\n",
    "            #print(already_rated)\n",
    "            #already_rated = already_rated[:-1]\n",
    "            ratings_old = rating_tensor[:-5]\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            # del ratings[chosen_item]\n",
    "            for timestep in range(0,time_max):\n",
    "                curr_item = chosen_items[timestep]\n",
    "                #print(curr_item)\n",
    "                ratings[n+timestep] = user_action_clamped[timestep]\n",
    "                #print(ratings)\n",
    "                already_rated.append(curr_item)\n",
    "                #print(len(already_rated))\n",
    "                #print(ratings[:n+timestep+1].shape)\n",
    "                user_vector = update_user_tensor_five(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_five.qi[item_to_be_reached])))\n",
    "            item_rating.backward()\n",
    "            optimizer.step()\n",
    "            # print(user_action.grad)\n",
    "            # print(user_action)\n",
    "            optimizer.zero_grad()\n",
    "            #user_action = user_action.clamp(1, 5) \n",
    "\n",
    "        final_rating = -item_rating.item()\n",
    "        #now get probability\n",
    "        total_sum = 0\n",
    "        for item in range(len(model_last_five.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.from_numpy(model_last_five.qi[item])))\n",
    "        reach_probabilities.append(final_rating/total_sum)\n",
    "    outer_reach_prob1.append(sum(reach_probabilities))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sum(outer_reach_prob1)/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Stochastic choice\n",
    "# import wandb\n",
    "outer_reach_prob1_less =[]\n",
    "for u in mid_users:\n",
    "    print(\"Hey\")\n",
    "    all_items = list(range(n_items))\n",
    "    already_rated_outer = list(user_item_rating_dict[u].keys())\n",
    "    # Remove items that are already rated\n",
    "    available_items = [item for item in all_items if item not in already_rated_outer]\n",
    "    # Sample num_samples items at random from available_items\n",
    "    items_to_be_reached = random.sample(available_items, min(7, len(available_items)))\n",
    "    #select a pool of 50 items that the user has not rated\n",
    "# wandb.init(project=\"reachability-single-stochastic\", name=\"run_1_lr_0.08\")\n",
    "    item_and_rating =  trainset.ur[u][-5:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[u]\n",
    "    for j in user_item_rating_dict[u]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    for i in tqdm(items_to_be_reached):\n",
    "        print(\"Ho\")\n",
    "        final_rating=0\n",
    "        sample_size=10\n",
    "        user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "        optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "        item_to_be_reached = i\n",
    "        for epoch in range(1, 50):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.from_numpy(model_last_five.pu[u])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = 5\n",
    "            already_rated = list(user_item_rating_dict[u].keys())\n",
    "            already_rated = already_rated[:-5]\n",
    "            #print(already_rated)\n",
    "            #already_rated = already_rated[:-1]\n",
    "            ratings_old = rating_tensor[:-5]\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            # del ratings[chosen_item]\n",
    "            for timestep in range(0,time_max):\n",
    "                curr_item = chosen_items[timestep]\n",
    "                #print(curr_item)\n",
    "                ratings[n+timestep] = user_action_clamped[timestep]\n",
    "                #print(ratings)\n",
    "                already_rated.append(curr_item)\n",
    "                #print(len(already_rated))\n",
    "                #print(ratings[:n+timestep+1].shape)\n",
    "                user_vector = update_user_tensor_five(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_five.qi[item_to_be_reached])))\n",
    "            item_rating.backward()\n",
    "            optimizer.step()\n",
    "            # print(user_action.grad)\n",
    "            # print(user_action)\n",
    "            optimizer.zero_grad()\n",
    "            #user_action = user_action.clamp(1, 5) \n",
    "\n",
    "        final_rating = -item_rating.item()\n",
    "        #now get probability\n",
    "        total_sum = 0\n",
    "        for item in range(len(model_last_five.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.from_numpy(model_last_five.qi[item])))\n",
    "        reach_probabilities.append(final_rating/total_sum)\n",
    "    outer_reach_prob1_less.append(sum(reach_probabilities))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob1_less"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "outer_reach_prob1_less"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sum(outer_reach_prob1_less)/10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay let's think about stability\n",
    "#so I select a user randomly, change some ratings uniformly at random. okay in this case I would have to retrain the recommender system right?\n",
    "#or just do what I did for users but with items: update_item_tensor?\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#param = user_action\n",
    "#okay lets say I am looking at item at history time 4 steps before current time\n",
    "#so does that mean the other interactions never happened?\n",
    "#then my latent vector is wrong even to start with\n",
    "\n",
    "# user_action = \n",
    "#what if the item gets recommended some time in the middle itself and I choose it\n",
    "#or do I specifically not choose it"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay so I want to optimize for user actions? best user action\n",
    "#my objective function is the probability that an item I want to reach is recommended and I am optimizing over the user action space, that's what I'm updating\n",
    "#    user_vector = update_user_vector(user_vector, already_rated, np.array(list(ratings.values())))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_item_tensor(item_vector, users, ratings):\n",
    "    Q_list = [model.pu[user] for user in users]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#create a table\n",
    "#each row indicates time, each column indicates item\n",
    "#t=0, need to decide (0, i1), (0, i2), (0, i3)\n",
    "#t=1, need to decide (1, i1 | (0, i1)), (1, i2 | (0, i1)), (1, i3 | (0, i1)); (1, i1 | (0, i2)), (1, i2 | (0, i2)), (1, i3 | (0, i2)); (1, i1 | (0, i3)), (1, i2 | (0, i3)), (1, i3 | (0, i3));\n",
    "#(t, i) + history -> RNN -> positive value\n",
    "#our current table: replying on user action is only time dependent but not history dependent\n",
    "#it'll give you the rating corresponding to that item\n",
    "#so I will change a user's rating for some item, then I will update the item vector\n",
    "#choose an adversarial user at random\n",
    "#now start choosing items and ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_users"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_items = len(model.qi)\n",
    "n_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_np = model.qi"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_all_preferences(user_vector, item_vector_copy, already_rated):\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ torch.tensor(item_vector_copy[item])\n",
    "        predicted_ratings[item] = item_rating\n",
    "    sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    count_var = 0\n",
    "    unrated_item_names=[]\n",
    "    for i in sorted_pred_ratings:\n",
    "        item_id = i[0]\n",
    "        if item_id not in already_rated:\n",
    "            count_var+=1\n",
    "            unrated_item_names.append(item_id)\n",
    "    return torch.tensor(unrated_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Consider user 20\n",
    "uid = 20\n",
    "other_users = []\n",
    "for i in range(0,n_users):\n",
    "    if i != uid:\n",
    "        other_users.append(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay here I define a neural network that takes a (t,i) tuple and a history vector as input and outputs a rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_user_matrix = trainset.ir"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_user_matrix"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.set_default_dtype(torch.float64)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import numpy as np\n",
    "\n",
    "# Define your RNN model\n",
    "class StabilityRNN(nn.Module):\n",
    "    def __init__(self, input_size, hidden_size, output_size):\n",
    "        super(StabilityRNN, self).__init__()\n",
    "        self.hidden_size = hidden_size\n",
    "        self.rnn = nn.RNN(input_size, hidden_size, batch_first=True)\n",
    "        self.fc = nn.Linear(hidden_size, output_size)\n",
    "\n",
    "    def forward(self, x):\n",
    "        out, _ = self.rnn(x)\n",
    "        out = self.fc(out[:, -1, :])\n",
    "        return out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# # Prepare your data\n",
    "# # Let's assume you have sequences of item IDs and their corresponding ratings\n",
    "# # Convert these sequences into PyTorch tensors\n",
    "# # For simplicity, let's assume each item ID and rating are represented as integers\n",
    "# rated_item_ids = [1, 3, 5, 21]  # Item IDs rated before time t-1\n",
    "# item_id_to_rate = 26  # Item ID to rate at time t\n",
    "\n",
    "# # Combine the rated item IDs and the item ID to rate\n",
    "# item_ids_input = rated_item_ids + [item_id_to_rate]\n",
    "\n",
    "# # Get the number of unique items\n",
    "# n_items = max(item_ids_input) + 1\n",
    "\n",
    "# # Convert item IDs to one-hot vectors\n",
    "# item_ids_onehot = np.eye(n_items)[item_ids_input]\n",
    "# item_ids_input_tensor = torch.tensor(item_ids_onehot, dtype=torch.float32).unsqueeze(0)  # Add batch dimension\n",
    "\n",
    "# # Define hyperparameters\n",
    "# input_size = n_items  # Input size is now equal to the number of unique items\n",
    "# hidden_size = 128\n",
    "# output_size = 1  # Assuming you're predicting a single rating\n",
    "# learning_rate = 0.001\n",
    "# num_epochs = 100\n",
    "\n",
    "# # Initialize your model\n",
    "# model_rnn = StabilityRNN(input_size, hidden_size, output_size)\n",
    "\n",
    "# # # Define loss function and optimizer\n",
    "# # criterion = nn.MSELoss()\n",
    "# # optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n",
    "\n",
    "# print(model_rnn(item_ids_input_tensor)[0][0])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#I need to find the sequence of items and ratings that will cause the most shift"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "\n",
    "def tensor_difference_metric(tensor1, tensor2):\n",
    "    # Create a tensor to store indices of elements in tensor2\n",
    "    indices_tensor = torch.arange(tensor2.size(0)).repeat(tensor2.size(0), 1)\n",
    "\n",
    "    # Mask the indices_tensor where tensor2 values match tensor1 values\n",
    "    mask = (tensor2.unsqueeze(1) == tensor1.unsqueeze(0))#.float()\n",
    "    masked_indices_tensor = indices_tensor * mask\n",
    "\n",
    "    # Calculate the sum of indices for each element in tensor1\n",
    "    #pdb.set_trace()\n",
    "    sum_indices = masked_indices_tensor.sum(dim=1).float()\n",
    "    abs_diff_sum = torch.sum(torch.abs(torch.arange(tensor1.size(0)).float() - sum_indices))#.sum().item()\n",
    "    #print(type(abs_diff_sum))\n",
    "    average_abs_diff = abs_diff_sum / tensor1.size(0)\n",
    "\n",
    "    return average_abs_diff\n",
    "\n",
    "# Example usage\n",
    "tensor1 = torch.tensor([1, 2, 3, 5, 4])\n",
    "tensor2 = torch.tensor([1, 2, 3, 4, 5])\n",
    "difference_metric = tensor_difference_metric(tensor1, tensor2)\n",
    "print(\"Difference Metric:\", difference_metric)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "candidate_items = []\n",
    "for i in sorted_items:\n",
    "    candidate_items.append(i[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_vector = torch.tensor(model.pu[uid])\n",
    "already_rated = list(user_item_rating_dict[uid].keys())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_items= len(model.qi)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "input_size = 100 #n_items  # Input size is now equal to the number of unique items\n",
    "hidden_size = 64 #128\n",
    "output_size = 1  # Assuming you're predicting a single rating\n",
    "learning_rate = 0.001\n",
    "num_epochs = 100\n",
    "\n",
    "# Initialize your model\n",
    "model_rnn = StabilityRNN(input_size, hidden_size, output_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Choose an adversarial user at random\n",
    "enemy_id = random.choice(other_users)\n",
    "n_epochs = 2000\n",
    "time_limit = 10\n",
    "optimizer = torch.optim.Adam(model_rnn.parameters(), lr=0.08)\n",
    "#okay now go over epochs\n",
    "initial_rec_list = get_all_preferences(user_vector, already_rated)\n",
    "for epoch in range(0,n_epochs):\n",
    "    #okay now I will be looking at a sequence of 10 items\n",
    "    history=[]\n",
    "    #set candidate items here\n",
    "    #set item_vector_copy here\n",
    "    for t in range(0,time_limit):\n",
    "        #okay now let's choose an item at random\n",
    "        curr_item = random.choice(candidate_items)\n",
    "        #now remove it from candidate items\n",
    "        history.append(curr_item)\n",
    "        item_ids_onehot = np.eye(n_items)[history]\n",
    "        item_ids_input_tensor = torch.tensor(item_ids_onehot, dtype=torch.float32).unsqueeze(0)  # Add batch dimension\n",
    "        curr_rating = model_rnn(item_ids_input_tensor)[0][0]\n",
    "        user_list = item_user_matrix[curr_item].keys()\n",
    "        rating_list = item_user_matrix[curr_item].values()\n",
    "        if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            rating_list.append(curr_rating)\n",
    "        else:\n",
    "            ind = user_list.index(enemy_id)\n",
    "            rating_list[ind] = curr_rating\n",
    "        item_vector_copy[curr_item] = update_item_tensor(item_vector_copy[curr_item], user_list, rating_list)\n",
    "    final_rec_list = get_all_preferences(user_vector, already_rated)\n",
    "    distance_metric = list_difference_metric(initial_rec_list, final_rec_list)\n",
    "    distance_metric.backward()\n",
    "    optimizer.step()\n",
    "    \n",
    "    optimizer.zero_grad()\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Choose an adversarial user at random\n",
    "enemy_id = random.choice(other_users)\n",
    "n_epochs = 2000\n",
    "time_limit = 10\n",
    "optimizer = torch.optim.Adam(model_rnn.parameters(), lr=0.08)\n",
    "#okay now go over epochs\n",
    "initial_rec_list = get_all_preferences(user_vector, torch.from_numpy(item_vector_copy_np), already_rated)\n",
    "for epoch in tqdm(range(0,n_epochs)):\n",
    "    #okay now I will be looking at a sequence of 10 items\n",
    "    history=torch.zeros(time_limit, dtype=torch.int64)\n",
    "    #set candidate items here\n",
    "    candidate_items = [i for i in range(0,n_items)]\n",
    "    #set item_vector_copy here\n",
    "    item_vector_copy = torch.from_numpy(item_vector_copy_np)\n",
    "    for t in range(0,time_limit):\n",
    "        #okay now let's choose an item at random\n",
    "        curr_item = random.choice(candidate_items)\n",
    "        #now remove it from candidate items\n",
    "        candidate_items.remove(curr_item)\n",
    "        history[t] = curr_item\n",
    "        #print(history[:t+1])\n",
    "        item_ids_onehot = torch.eye(n_items)[history[:t+1]]\n",
    "        item_ids_input_tensor = item_ids_onehot.unsqueeze(0)  # Add batch dimension\n",
    "        curr_rating = model_rnn(item_ids_input_tensor)[0][0]\n",
    "        user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        rating_list = [item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            rating_list.append(curr_rating)\n",
    "        else:\n",
    "            ind = user_list.index(enemy_id)\n",
    "            rating_list[ind] = curr_rating\n",
    "        item_vector_copy[curr_item] = update_item_tensor(item_vector_copy[curr_item], user_list, torch.tensor(rating_list, dtype=torch.float64))\n",
    "    final_rec_list = get_all_preferences(user_vector, item_vector_copy, already_rated)\n",
    "    distance_metric = tensor_difference_metric(initial_rec_list, final_rec_list)\n",
    "    distance_metric.requires_grad = True\n",
    "    distance_metric.backward()\n",
    "    optimizer.step()\n",
    "    \n",
    "    optimizer.zero_grad()\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_ids_onehot = torch.eye(n_items)[[2,3,5]]\n",
    "item_ids_input_tensor = item_ids_onehot.unsqueeze(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_ids_input_tensor.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.save(model_rnn.state_dict(), 'stability_predictor.pth')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay so now I have a model that given an adversarial user and their rating history so far can change the rating of the current item under consideration to\n",
    "#the rating that will most affect my primary user's recommendation list\n",
    "#so this model is trained on a particular adversarial user\n",
    "#I need to find the sequence of ratings by the adversarial user that can change my primary user's rating the most\n",
    "#can I do it in a greedy manner?"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "time_limit = 10\n",
    "history=torch.zeros(time_limit, dtype=torch.int64)\n",
    "initial_rec_list = get_all_preferences(user_vector, torch.from_numpy(item_vector_copy_np), already_rated)\n",
    "for t in range(0, time_limit):\n",
    "    best_item = -1\n",
    "    best_val = -1\n",
    "    for i in range(0,n_items):\n",
    "        history[t] = i\n",
    "        item_ids_onehot = torch.eye(n_items)[history[:t+1]]\n",
    "        item_ids_input_tensor = item_ids_onehot.unsqueeze(0)  # Add batch dimension\n",
    "        curr_rating = model_rnn(item_ids_input_tensor)[0][0]\n",
    "        user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        rating_list = [item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            rating_list.append(curr_rating)\n",
    "        else:\n",
    "            ind = user_list.index(enemy_id)\n",
    "            rating_list[ind] = curr_rating\n",
    "        item_vector_copy[curr_item] = update_item_tensor(item_vector_copy[curr_item], user_list, torch.tensor(rating_list, dtype=torch.float64))\n",
    "        final_rec_list = get_all_preferences(user_vector, already_rated)\n",
    "        distance_metric = tensor_difference_metric(initial_rec_list, final_rec_list)        \n",
    "        if distance_metric>best_val:\n",
    "            best_item = i\n",
    "            best_val = distance_metric\n",
    "    history[t] = best_item"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(history)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "[item_user_matrix[5][i][0] for i in range(len(item_user_matrix[5]))]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.tensor([item_vector_copy_np[2], item_vector_copy_np[2]]).shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def append_to_history(history, item_tensor):\n",
    "    # If history is None, initialize it with the shape of item_tensor\n",
    "    if history is None:\n",
    "        history = item_tensor.unsqueeze(0).unsqueeze(0)\n",
    "    else:\n",
    "        # Otherwise, append item_tensor along the second dimension of history\n",
    "        item_tensor = item_tensor.unsqueeze(0).unsqueeze(0)\n",
    "        # print(item_tensor)\n",
    "        # print(history)\n",
    "        history = torch.cat((history, item_tensor), dim=1)\n",
    "    return history"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Choose an adversarial user at random\n",
    "enemy_id = random.choice(other_users)\n",
    "enemy_vector = torch.tensor(model.pu[enemy_id])\n",
    "n_epochs = 1000\n",
    "time_limit = 10\n",
    "optimizer = torch.optim.Adam(model_rnn.parameters(), lr=0.08)\n",
    "#okay now go over epochs\n",
    "initial_rec_list = get_all_preferences(user_vector, torch.from_numpy(item_vector_copy_np), already_rated)\n",
    "for epoch in tqdm(range(0,n_epochs)):\n",
    "    #okay now I will be looking at a sequence of 10 items\n",
    "    history=torch.zeros(time_limit, dtype=torch.int64)\n",
    "    history_vectors = None\n",
    "    #set candidate items here\n",
    "    candidate_items = [i for i in range(0,n_items)]\n",
    "    #set item_vector_copy here\n",
    "    item_vector_copy = torch.from_numpy(item_vector_copy_np)\n",
    "    enemy_already_rated = list(user_item_rating_dict[enemy_id].keys())\n",
    "    for t in range(0,time_limit):\n",
    "        #okay now let's choose an item at random\n",
    "        a, b = get_recommendation_scores(enemy_vector, enemy_already_rated)#item recommended to you #random.choice(candidate_items)\n",
    "        curr_item, curr_score = a[0], b[0]\n",
    "        enemy_already_rated.append(curr_item)\n",
    "        #now remove it from candidate items\n",
    "        candidate_items.remove(curr_item)\n",
    "        history[t] = curr_item\n",
    "        history_vectors = append_to_history(history_vectors, item_vector_copy[curr_item])\n",
    "        #print(history[:t+1])\n",
    "        # item_ids_onehot = torch.eye(n_items)[history[:t+1]]\n",
    "        #item_ids_input_tensor = item_vector_copy[curr_item]  # Add batch dimension\n",
    "        curr_rating = model_rnn(history_vectors)[0][0]\n",
    "        user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        rating_list = [item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))]\n",
    "        if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            rating_list.append(curr_rating)\n",
    "        else:\n",
    "            ind = user_list.index(enemy_id)\n",
    "            rating_list[ind] = curr_rating\n",
    "        item_vector_copy[curr_item] = update_item_tensor(item_vector_copy[curr_item], user_list, torch.tensor(rating_list, dtype=torch.float64))\n",
    "    final_rec_list = get_all_preferences(user_vector, item_vector_copy, already_rated)\n",
    "    distance_metric = tensor_difference_metric(initial_rec_list, final_rec_list)\n",
    "    distance_metric.requires_grad = True\n",
    "    distance_metric.backward()\n",
    "    optimizer.step()\n",
    "    \n",
    "    optimizer.zero_grad()\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.save(model_rnn.state_dict(), 'stability_predictor_rec_policy.pth')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "input_size = 100 #n_items  # Input size is now equal to the number of unique items\n",
    "hidden_size = 64 #128\n",
    "output_size = 1  # Assuming you're predicting a single rating\n",
    "learning_rate = 0.001\n",
    "num_epochs = 100\n",
    "\n",
    "# Initialize your model\n",
    "model_rnn = StabilityRNN(input_size, hidden_size, output_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model_rnn.load_state_dict(torch.load('stability_predictor_rec_policy.pth'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import numpy as np\n",
    "\n",
    "# Define your RNN model\n",
    "class StabilityRNN1(nn.Module):\n",
    "    def __init__(self, input_size, hidden_size, output_size):\n",
    "        super(StabilityRNN1, self).__init__()\n",
    "        self.hidden_size = hidden_size\n",
    "        self.rnn = nn.RNN(input_size + 100, hidden_size, batch_first=True)\n",
    "        self.fc = nn.Linear(hidden_size, output_size)\n",
    "\n",
    "    def forward(self, x, enemy_vector):\n",
    "        x = torch.cat((x, enemy_vector.unsqueeze(0).repeat(x.size(0), 1)), dim=2)\n",
    "        out, _ = self.rnn(x)\n",
    "        out = self.fc(out[:, -1, :])\n",
    "        return out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "enemy_vector = torch.tensor(model.pu[4])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "input_size = 100 #n_items  # Input size is now equal to the number of unique items\n",
    "hidden_size = 64 #128\n",
    "output_size = 1  # Assuming you're predicting a single rating\n",
    "learning_rate = 0.001\n",
    "num_epochs = 100\n",
    "\n",
    "# Initialize your model\n",
    "model_rnn1 = StabilityRNN1(input_size, hidden_size, output_size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#TESTING FUTURE STABILITY HERE. INCOMPLETE CODE, COME BACK LATER.\n",
    "\n",
    "\n",
    "#Choose an adversarial user at random\n",
    "enemy_ids = random.sample(other_users, 10)\n",
    "n_epochs = 1000\n",
    "time_limit = 5\n",
    "optimizer = torch.optim.Adam(model_rnn1.parameters(), lr=0.08)\n",
    "#okay now go over epochs\n",
    "initial_rec_list = get_all_preferences(user_vector, torch.from_numpy(item_vector_copy_np), already_rated)\n",
    "for epoch in tqdm(range(0, n_epochs)):\n",
    "    for enemy_id in enemy_ids:\n",
    "        enemy_vector = model.pu[enemy_id]\n",
    "        #okay now I will be looking at a sequence of 10 items\n",
    "        history=torch.zeros(time_limit, dtype=torch.int64)\n",
    "        history_vectors = None\n",
    "        #set candidate items here\n",
    "        candidate_items = [i for i in range(0,n_items)]\n",
    "        #set item_vector_copy here\n",
    "        item_vector_copy = torch.from_numpy(item_vector_copy_np)\n",
    "        enemy_already_rated = list(user_item_rating_dict[enemy_id].keys())\n",
    "        for t in range(0,time_limit):\n",
    "            #okay now let's choose an item at random\n",
    "            a, b = get_recommendation_scores(enemy_vector, enemy_already_rated)#item recommended to you #random.choice(candidate_items)\n",
    "            curr_item, curr_score = a[0], b[0]\n",
    "            enemy_already_rated.append(curr_item)\n",
    "            #now remove it from candidate items\n",
    "            candidate_items.remove(curr_item)\n",
    "            history[t] = curr_item\n",
    "            history_vectors = append_to_history(history_vectors, item_vector_copy[curr_item])\n",
    "            #print(history[:t+1])\n",
    "            # item_ids_onehot = torch.eye(n_items)[history[:t+1]]\n",
    "            #item_ids_input_tensor = item_vector_copy[curr_item]  # Add batch dimension\n",
    "            curr_rating = model_rnn(history_vectors)[0][0]\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = [item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            if enemy_id not in user_list:\n",
    "                user_list.append(enemy_id)\n",
    "                rating_list.append(curr_rating)\n",
    "            else:\n",
    "                ind = user_list.index(enemy_id)\n",
    "                rating_list[ind] = curr_rating\n",
    "            item_vector_copy[curr_item] = update_item_tensor(item_vector_copy[curr_item], user_list, torch.tensor(rating_list, dtype=torch.float64))\n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy, already_rated)\n",
    "        distance_metric = tensor_difference_metric(initial_rec_list, final_rec_list)\n",
    "        distance_metric.requires_grad = True\n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        \n",
    "        optimizer.zero_grad()\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#PAST STABILITY\n",
    "#CHOOSE 10 RANDOM USERS AS ADVERSARIES\n",
    "#NOW LETS LOOK AT THE PAST-1-STABILITY OF INFLUENTIAL AND MID USERS TO THEIR ACTIONS\n",
    "#PARAMETER SPACE WILL BE 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_users = list(range(n_users))\n",
    "\n",
    "# Filter out numbers present in influential_users or mid_users\n",
    "available_users = [i for i in all_users if i not in top_influential_users and i not in mid_users]\n",
    "\n",
    "# Choose 10 random items from the available items\n",
    "chosen_users = random.sample(available_users, 10)\n",
    "\n",
    "print(chosen_users)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items = [list(user_item_rating_dict[u].keys())[-1] for u in chosen_users]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings = [list(user_item_rating_dict[u].values())[-1] for u in chosen_users]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings = [torch.tensor(item) for item in chosen_ratings]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_one_ = model_last_item.qi.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_one = torch.from_numpy(item_vector_copy_one_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_one_changed_ = model_last_item.qi.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_one_changed = torch.from_numpy(item_vector_copy_one_changed_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_user_matrix = trainset1.ir"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_item_matrix = trainset1.ur"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_item_rating_dict = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in user_item_matrix.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def get_all_preferences(user_vector, item_vector_copy_h, already_rated):\n",
    "#     n_items = len(item_vector_copy_h)\n",
    "#     predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "#     for item in range(0, n_items):\n",
    "#         item_rating = user_vector @ item_vector_copy_h[item]\n",
    "#         predicted_ratings[item] = item_rating\n",
    "#     sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "#     count_var = 0\n",
    "#     unrated_item_names=[]\n",
    "#     for i in sorted_pred_ratings:\n",
    "#         item_id = i[0]\n",
    "#         if item_id not in already_rated:\n",
    "#             count_var+=1\n",
    "#             unrated_item_names.append(item_id)\n",
    "#     return torch.tensor(unrated_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 3703 items\n",
    "# 5 items\n",
    "# 3698\n",
    "#\n",
    "\n",
    "def get_all_preferences(user_vector_1, item_vector_copy_h):\n",
    "    # Compute ratings for each item by dot product with user_vector\n",
    "    item_ratings = torch.matmul(item_vector_copy_h, user_vector_1.unsqueeze(1))\n",
    "    return item_ratings.squeeze(1) \n",
    "\n",
    "# def get_all_preferences(user_vector, item_vector_copy_h, already_rated):\n",
    "#     item_ratings = torch.matmul(item_vector_copy_h, user_vector.unsqueeze(1)).squeeze(1)\n",
    "#     sorted_indices = torch.argsort(item_ratings, descending=True)\n",
    "    \n",
    "#     # # Create a mask indicating whether each item is already rated\n",
    "#     # mask = torch.zeros_like(item_ratings, dtype=torch.bool)\n",
    "#     # mask[already_rated] = True\n",
    "    \n",
    "#     # # Filter out the indices of items that are not already rated\n",
    "#     # unrated_indices = sorted_indices[~mask]\n",
    "    \n",
    "#     return sorted_indices\n",
    "\n",
    "# def get_all_preferences(user_vector, item_vector_copy, already_rated):\n",
    "#     predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "#     for item in range(0, n_items):\n",
    "#         item_rating = user_vector @ torch.tensor(item_vector_copy[item])\n",
    "#         predicted_ratings[item] = item_rating\n",
    "#     sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "#     count_var = 0\n",
    "#     unrated_item_names=[]\n",
    "#     for i in sorted_pred_ratings:\n",
    "#         item_id = i[0]\n",
    "#         if item_id not in already_rated:\n",
    "#             count_var+=1\n",
    "#             unrated_item_names.append(item_id)\n",
    "#     return torch.tensor(unrated_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_item_tensor(item_vector, users, ratings):\n",
    "    Q_list = [model_last_item.pu[user] for user in users]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mse = torch.nn.MSELoss()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_1 = []\n",
    "for u in top_influential_users:\n",
    "    user_vector = torch.tensor(model_last_item.pu[u])\n",
    "    already_rated = list(user_item_rating_dict[u].keys())\n",
    "    chosen_ratings_opt = chosen_ratings.copy()\n",
    "    for param in chosen_ratings_opt:\n",
    "        param.requires_grad_(True)\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy_one)\n",
    "    #initial_rec_list.requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam(chosen_ratings_opt, lr=0.08)\n",
    "    #print(initial_rec_list)\n",
    "    n_epochs = 50\n",
    "    curr_stability = None\n",
    "    distance_metric2 = None\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        item_vector_copy_one_changed_ = model_last_item.qi.copy()\n",
    "        item_vector_copy_one_changed = torch.from_numpy(item_vector_copy_one_changed_)\n",
    "        for enemy_num in range(0,1):\n",
    "            enemy_id = chosen_users[enemy_num]\n",
    "            curr_item = chosen_items[enemy_num]\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "            #if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            #rating_list.append(chosen_ratings_opt[enemy_num])\n",
    "            rating_list = torch.cat((rating_list, chosen_ratings_opt[enemy_num].unsqueeze(0)), dim=0)\n",
    "            # else:\n",
    "            #     ind = user_list.index(enemy_id)\n",
    "            #     rating_list[ind] = chosen_ratings_opt[enemy_num]\n",
    "            item_vector_copy_one_changed[curr_item] = update_item_tensor(item_vector_copy_one_changed[curr_item], user_list, rating_list)\n",
    "        \n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_one_changed)\n",
    "        distance_metric2 = -mse(final_rec_list,initial_rec_list)#-torch.norm(final_rec_list - initial_rec_list, p=2)#-tensor_difference_metric(initial_rec_list, final_rec_list)#+sum(chosen_ratings_opt)\n",
    "        #distance_metric.requires_grad_()\n",
    "        print(distance_metric2)\n",
    "        #print(distance_metric.grad)\n",
    "        \n",
    "        distance_metric2.backward()\n",
    "        print(final_rec_list.grad)\n",
    "        # for kk in range(0,len(chosen_ratings_opt)):\n",
    "        #     print(chosen_ratings_opt[kk].grad)\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "        \n",
    "    \n",
    "    curr_stability = distance_metric2.item()\n",
    "    all_stability_1.append(curr_stability)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "1/(sum(all_stability_1)/10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_2 = []\n",
    "for u in mid_users:\n",
    "    user_vector = torch.tensor(model_last_item.pu[u])\n",
    "    already_rated = list(user_item_rating_dict[u].keys())\n",
    "    chosen_ratings_opt = chosen_ratings.copy()\n",
    "    for param in chosen_ratings_opt:\n",
    "        param.requires_grad_(True)\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy_one)\n",
    "    optimizer = torch.optim.Adam(chosen_ratings_opt, lr=0.08)\n",
    "    n_epochs = 50\n",
    "    curr_stability = None\n",
    "    distance_metric2 = None\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        item_vector_copy_one_changed_ = model_last_item.qi.copy()\n",
    "        item_vector_copy_one_changed = torch.from_numpy(item_vector_copy_one_changed_)\n",
    "        for enemy_num in range(0,1):\n",
    "            enemy_id = chosen_users[enemy_num]\n",
    "            curr_item = chosen_items[enemy_num]\n",
    "            #print(chosen_ratings_opt[enemy_num].requires_grad)\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "            #if enemy_id not in user_list:\n",
    "            user_list.append(enemy_id)\n",
    "            #rating_list.append(chosen_ratings_opt[enemy_num])\n",
    "            rating_list = torch.cat((rating_list, chosen_ratings_opt[enemy_num].unsqueeze(0)), dim=0)\n",
    "            # else:\n",
    "            #     ind = user_list.index(enemy_id)\n",
    "            #     rating_list[ind] = chosen_ratings_opt[enemy_num]\n",
    "            item_vector_copy_one_changed[curr_item] = update_item_tensor(item_vector_copy_one_changed[curr_item], user_list, rating_list)\n",
    "        \n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_one_changed)\n",
    "        distance_metric2 = -mse(final_rec_list,initial_rec_list)#-torch.norm(final_rec_list - initial_rec_list, p=2)#-tensor_difference_metric(initial_rec_list, final_rec_list)#+sum(chosen_ratings_opt)\n",
    "        print(distance_metric2) \n",
    "        distance_metric2.backward()\n",
    "        print(final_rec_list.grad)\n",
    "        # for kk in range(0,len(chosen_ratings_opt)):\n",
    "        #     print(chosen_ratings_opt[kk].grad)\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "        \n",
    "    \n",
    "    curr_stability = distance_metric2.item()\n",
    "    all_stability_2.append(curr_stability)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "1/(sum(all_stability_2)/10) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_vector_copy_one.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "type(item_vector_copy_one)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_stability_1 = []\n",
    "for u in mid_users:\n",
    "    user_vector = torch.tensor(model_last_item.pu[u])\n",
    "    already_rated = list(user_item_rating_dict[u].keys())\n",
    "    tensor1 = get_all_preferences(user_vector, torch.from_numpy(item_vector_copy_one), already_rated)\n",
    "    optimizer = torch.optim.Adam(chosen_ratings, lr=0.08)\n",
    "    #print(initial_rec_list)\n",
    "    n_epochs = 50\n",
    "    curr_stability = 0\n",
    "    distance_metric = torch.tensor(0.) \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        for enemy_num in range(0,len(chosen_users)):\n",
    "            enemy_id = chosen_users[enemy_num]\n",
    "            curr_item = chosen_items[enemy_num]\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = [item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            if enemy_id not in user_list:\n",
    "                user_list.append(enemy_id)\n",
    "                rating_list.append(chosen_ratings[enemy_num])\n",
    "            else:\n",
    "                ind = user_list.index(enemy_id)\n",
    "                rating_list[ind] = chosen_ratings[enemy_num]\n",
    "            item_vector_copy_one_changed[curr_item] = update_item_tensor(item_vector_copy_one_changed[curr_item], user_list, torch.tensor(rating_list, dtype=torch.float64))\n",
    "        tensor2 = get_all_preferences(user_vector, item_vector_copy_one_changed, already_rated)\n",
    "        #print(final_rec_list)\n",
    "        #distance_metric = tensor_difference_metric(initial_rec_list, final_rec_list)\n",
    "        indices_tensor = torch.arange(tensor2.size(0)).repeat(tensor2.size(0), 1)\n",
    "\n",
    "        # Mask the indices_tensor where tensor2 values match tensor1 values\n",
    "        mask = (tensor2.unsqueeze(1) == tensor1.unsqueeze(0))#.float()\n",
    "        #print(mask)\n",
    "        masked_indices_tensor = indices_tensor * mask\n",
    "\n",
    "        # Calculate the sum of indices for each element in tensor1\n",
    "        sum_indices = masked_indices_tensor.sum(dim=1)\n",
    "        # Calculate the average absolute difference\n",
    "        abs_diff_sum = torch.sum(torch.abs(torch.arange(tensor1.size(0)).float() - sum_indices))#.sum().item()\n",
    "        #print(type(abs_diff_sum))\n",
    "        average_abs_diff = abs_diff_sum / tensor1.size(0)\n",
    "        print(average_abs_diff)\n",
    "        average_abs_diff.backward()\n",
    "        optimizer.step()\n",
    "        \n",
    "        optimizer.zero_grad()\n",
    "    curr_stability = distance_metric\n",
    "    all_stability_1.append(curr_stability.item())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Attempting to replicate results in Stochastic Reachability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#5 is the user we are looking at\n",
    "item_and_rating =  trainset.ur[5][-1]\n",
    "chosen_items = [item_and_rating[0]]\n",
    "chosen_ratings = [item_and_rating[1]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_action = torch.tensor(chosen_ratings)\n",
    "print(user_action)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lookup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "desired_key = None\n",
    "for key, value in user_lookup.items():\n",
    "    if value == 5:\n",
    "        desired_key = key\n",
    "        break\n",
    "\n",
    "if desired_key is not None:\n",
    "    print(\"Key with value 5:\", desired_key)\n",
    "else:\n",
    "    print(\"Value 5 not found in the dictionary.\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-history\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 14#6\n",
    "function_vals=[]\n",
    "action_vals=[]\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model_last_item.pu[5])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 1\n",
    "    already_rated = list(user_item_rating_dict[5].keys())\n",
    "    already_rated = already_rated[:-1]\n",
    "    ratings_old = rating_tensor[:-1]\n",
    "    n = len(ratings_old)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "    # del ratings[chosen_item]\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        curr_item = chosen_items[timestep]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item_to_be_reached])))\n",
    "    print(abs(item_rating))\n",
    "    function_vals.append(item_rating.item())\n",
    "    action_vals.append(user_action[0].item())\n",
    "    item_rating.backward()\n",
    "    print(user_action)\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "action_vals"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "function_vals"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.plot(action_vals, function_vals, marker='o', linestyle='-')\n",
    "plt.xlabel('Action Values')\n",
    "plt.ylabel('Function Values')\n",
    "plt.title('Plot of Function Values vs Action Values')\n",
    "plt.grid(True)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_action"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Ok now I replicate it by using movielens100k instead"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "file_path = \"../datasets/ml-100k/u.data\"\n",
    "\n",
    "# Load the dataset into a DataFrame\n",
    "df_100k = pd.read_csv(file_path, sep='\\t', header=None, names=['user_id', 'item_id', 'rating', 'timestamp'])\n",
    "\n",
    "# Display the first few rows of the DataFrame\n",
    "print(df_100k.head())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the movielens-100k dataset (download it if needed),\n",
    "# and split it into 3 folds for cross-validation.\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(df_100k[['user_id', 'item_id', 'rating']], reader)\n",
    "\n",
    "model_100k_full = SVD(biased=False)\n",
    "\n",
    "# # Perform cross-validation\n",
    "cv_results = cross_validate(model_100k_full, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# # Print the cross-validation results\n",
    "for measure in ['test_rmse', 'test_mae']:\n",
    "    print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset_100k = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "model_100k_full.fit(trainset_100k)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )\n",
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df\n",
    "mark_last_n_ratings_as_validation_set(df_100k, 1)\n",
    "train_df = df_100k[df_100k.is_valid==False]\n",
    "valid_df = df_100k[df_100k.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(train_df[['user_id', 'item_id', 'rating']], reader)\n",
    "\n",
    "model_last_item_100k = SVD(biased=False)\n",
    "\n",
    "# Perform cross-validation\n",
    "cv_results = cross_validate(model_last_item_100k, data, measures=['RMSE', 'MAE'], cv=5, verbose=True)\n",
    "\n",
    "# Print the cross-validation results\n",
    "for measure in ['test_rmse', 'test_mae']:\n",
    "    print(f\"{measure}: {cv_results[measure].mean()}\")\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset_100k_one = data.build_full_trainset()\n",
    "\n",
    "# Train the model on the whole dataset\n",
    "model_last_item.fit(trainset_100k_one)\n",
    "#change name\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k.n_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.n_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.to_inner_uid(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k.to_inner_uid(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#5 is the user we are looking at\n",
    "item_and_rating =  trainset_100k.ur[111][-1]\n",
    "chosen_items = [trainset_100k_one.to_inner_iid(trainset_100k.to_raw_iid(item_and_rating[0]))]\n",
    "chosen_ratings = [item_and_rating[1]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.to_raw_iid(chosen_items[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "chosen_ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_action = torch.tensor(chosen_ratings)\n",
    "print(user_action)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.ur"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "user_item_rating_dict = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in trainset_100k_one.ur.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# desired_key = None\n",
    "# for key, value in user_lookup.items():\n",
    "#     if value == 5:\n",
    "#         desired_key = key\n",
    "#         break\n",
    "\n",
    "# if desired_key is not None:\n",
    "#     print(\"Key with value 5:\", desired_key)\n",
    "# else:\n",
    "#     print(\"Value 5 not found in the dictionary.\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings = user_item_rating_dict[110]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in ratings:\n",
    "    ratings[i]=torch.tensor(ratings[i], dtype=torch.float64)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "rating_tensor = torch.tensor(list(ratings.values()))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_dict = ratings"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay so things I need for this are:\n",
    "#list of ratings they've given so far(ratings tensor)\n",
    "#old model(minus one item for every user)\n",
    "\n",
    "#they are not updating item vectors?\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "already_rated = list(user_item_rating_dict[110].keys())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(already_rated)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.to_inner_uid(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k_one.to_raw_iid(7)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#now allow changing history for multiple items at the initial time?\n",
    "#so param is a list of numbers where each number is the rating given by the user to every item they have rated?\n",
    "#okay can I fix the item choice but change the rating?\n",
    "#this is more sensible\n",
    "# import wandb\n",
    "# wandb.init(project=\"reachability-multi-history\", name=\"run_1_lr_0.08\")\n",
    "\n",
    "#Stochastic choice\n",
    "user_action = torch.tensor(chosen_ratings, requires_grad=True)\n",
    "optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "item_to_be_reached = 7\n",
    "function_vals=[]\n",
    "action_vals=[]\n",
    "for epoch in range(1, 50):\n",
    "    user_action_clamped = user_action.clamp(1, 5)\n",
    "    rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "    user_vector_initial = torch.from_numpy(model_last_item.pu[110])\n",
    "    user_vector = user_vector_initial\n",
    "    time_max = 1\n",
    "    already_rated = list(user_item_rating_dict[110].keys())\n",
    "    # already_rated = already_rated[:-1]\n",
    "    # ratings_old = rating_tensor[:-1]\n",
    "    n = len(rating_tensor)\n",
    "    zeros_to_add = torch.zeros(time_max)\n",
    "    ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "    # del ratings[chosen_item]\n",
    "    for timestep in tqdm(range(0,time_max)):\n",
    "        curr_item = chosen_items[timestep]\n",
    "        ratings[n+timestep] = user_action_clamped[timestep]\n",
    "        already_rated.append(curr_item)\n",
    "        user_vector = update_user_tensor_single(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "    partition_function = sum(torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[partition_item]))) for partition_item in range(len(model_last_item.qi)))\n",
    "    item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_last_item.qi[item_to_be_reached])))/partition_function\n",
    "    print(abs(item_rating))\n",
    "    function_vals.append(item_rating.item())\n",
    "    action_vals.append(user_action[0].item())\n",
    "    item_rating.backward()\n",
    "    print(user_action)\n",
    "    optimizer.step()\n",
    "    optimizer.zero_grad()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset_100k.to_inner_uid(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#baseline reachability\n",
    "user_vector_initial = torch.from_numpy(model_100k_full.pu[111])\n",
    "user_vector = user_vector_initial\n",
    "partition_function = sum(torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_100k_full.qi[partition_item]))) for partition_item in range(len(model_last_item.qi)))\n",
    "print(torch.exp(0.8*torch.matmul(user_vector, torch.from_numpy(model_100k_full.qi[item_to_be_reached])))/partition_function)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_to_be_reached"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
