{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Test Notebook\n",
    "!ls"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Specify the file paths for the dataset files\n",
    "users_path = \"../datasets/ml-1m/users.dat\"\n",
    "ratings_path = \"../datasets/ml-1m/ratings.dat\"\n",
    "movies_path = \"../datasets/ml-1m/movies.dat\"\n",
    "\n",
    "\n",
    "# Define column names for each dataset\n",
    "users_cols = ['user_id', 'gender', 'age', 'occupation', 'zip_code']\n",
    "ratings_cols = ['user_id', 'movie_id', 'rating', 'timestamp']\n",
    "movies_cols = ['movie_id', 'title', 'genres']\n",
    "\n",
    "# Load data into Pandas DataFrames\n",
    "users_df = pd.read_csv(users_path, sep='::', header=None, names=users_cols, encoding='latin-1', engine='python')\n",
    "ratings_df = pd.read_csv(ratings_path, sep='::', header=None, names=ratings_cols, encoding='latin-1', engine='python')\n",
    "movies_df = pd.read_csv(movies_path, sep='::', header=None, names=movies_cols, encoding='latin-1', engine='python')\n",
    "\n",
    "# Display the first few rows of each DataFrame\n",
    "print(\"Users DataFrame:\")\n",
    "print(users_df.head())\n",
    "\n",
    "print(\"\\nRatings DataFrame:\")\n",
    "print(ratings_df.head())\n",
    "\n",
    "print(\"\\nMovies DataFrame:\")\n",
    "print(movies_df.head())\n",
    "\n",
    "# Optionally, convert DataFrames to NumPy arrays/matrices\n",
    "users_array = users_df.values\n",
    "ratings_array = ratings_df.values\n",
    "movies_array = movies_df.values\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df = pd.merge(ratings_df, movies_df)[['user_id', 'title', 'rating', 'timestamp']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df[\"user_id\"] = ratings_df[\"user_id\"].astype(str)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lookup = {v: i+1 for i, v in enumerate(ratings_df['user_id'].unique())}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "movie_lookup = {v: i+1 for i, v in enumerate(ratings_df['title'].unique())}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_df['movie_id'] = ratings_df['title'].map(movie_lookup)\n",
    "ratings_df['user_int'] = ratings_df['user_id'].map(user_lookup)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "ratings_per_user = ratings_df.groupby('user_id').rating.count()\n",
    "ratings_per_item = ratings_df.groupby('movie_id').rating.count()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sorted_ratings_per_item = ratings_per_item.sort_values(ascending=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "l= [i for i in sorted_ratings_per_item[:30].keys()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "l"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_item_rating_tuples = ratings_df[['user_int', 'movie_id', 'rating']].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "min(ratings_df['movie_id'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(ratings_df[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset = data.build_full_trainset()\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "file_path = 'surprise_model_full.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Leave 1 out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )\n",
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df\n",
    "mark_last_n_ratings_as_validation_set(ratings_df, 1)\n",
    "train_df = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(train_df[['user_int', 'movie_id', 'rating']], reader)\n",
    "# Retrieve the trainset\n",
    "trainset1 = data.build_full_trainset()\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "file_path = 'surprise_model_last_item.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model_last_item = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_last_n_ratings_by_user(\n",
    "    df, n, min_ratings_per_user=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    return (\n",
    "        df.groupby(user_colname)\n",
    "        .filter(lambda x: len(x) >= min_ratings_per_user)\n",
    "        .sort_values(timestamp_colname)\n",
    "        .groupby(user_colname)\n",
    "        .tail(n)\n",
    "        .sort_values(user_colname)\n",
    "    )\n",
    "def mark_last_n_ratings_as_validation_set(\n",
    "    df, n, min_ratings=1, user_colname=\"user_id\", timestamp_colname=\"timestamp\"\n",
    "):\n",
    "    \"\"\"\n",
    "    Mark the chronologically last n ratings as the validation set.\n",
    "    This is done by adding the additional 'is_valid' column to the df.\n",
    "    :param df: a DataFrame containing user item ratings\n",
    "    :param n: the number of ratings to include in the validation set\n",
    "    :param min_ratings: only include users with more than this many ratings\n",
    "    :param user_id_colname: the name of the column containing user ids\n",
    "    :param timestamp_colname: the name of the column containing the imestamps\n",
    "    :return: the same df with the additional 'is_valid' column added\n",
    "    \"\"\"\n",
    "    df[\"is_valid\"] = False\n",
    "    df.loc[\n",
    "        get_last_n_ratings_by_user(\n",
    "            df,\n",
    "            n,\n",
    "            min_ratings,\n",
    "            user_colname=user_colname,\n",
    "            timestamp_colname=timestamp_colname,\n",
    "        ).index,\n",
    "        \"is_valid\",\n",
    "    ] = True\n",
    "\n",
    "    return df\n",
    "mark_last_n_ratings_as_validation_set(ratings_df, 5)\n",
    "train_df_5 = ratings_df[ratings_df.is_valid==False]\n",
    "valid_df_5 = ratings_df[ratings_df.is_valid==True]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import Dataset, Reader\n",
    "from surprise.model_selection import cross_validate\n",
    "from surprise import SVD\n",
    "from surprise import accuracy\n",
    "\n",
    "reader = Reader()\n",
    "data = Dataset.load_from_df(train_df_5[['user_int', 'movie_id', 'rating']], reader)\n",
    "\n",
    "# Retrieve the trainset\n",
    "trainset5 = data.build_full_trainset()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from surprise import dump\n",
    "\n",
    "file_path = 'surprise_model_last_five.dump'\n",
    "\n",
    "# Load the saved model\n",
    "_, model_last_five = dump.load(file_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get the user-item rating matrix from the trainset\n",
    "user_item_matrix = trainset.ur\n",
    "total_triplets = sum(len(items) for items in user_item_matrix.values())\n",
    "\n",
    "print(\"Total Triplets:\", total_triplets)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get the user-item rating matrix from the trainset\n",
    "user_item_matrix_1 = trainset1.ur\n",
    "total_triplets1 = sum(len(items) for items in user_item_matrix_1.values())\n",
    "\n",
    "print(\"Total Triplets:\", total_triplets1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get the user-item rating matrix from the trainset\n",
    "user_item_matrix_5 = trainset5.ur\n",
    "total_triplets5 = sum(len(items) for items in user_item_matrix_5.values())\n",
    "\n",
    "print(\"Total Triplets:\", total_triplets5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Now to create the same lists we created earlier\n",
    "#already_rated list\n",
    "#popularity ranking list\n",
    "from collections import defaultdict\n",
    "\n",
    "item_occurrences = defaultdict(int)\n",
    "for items in user_item_matrix.values():\n",
    "    for item, _ in items:\n",
    "        item_occurrences[item] += 1\n",
    "\n",
    "# Step 2: Sort items by popularity\n",
    "sorted_items = sorted(item_occurrences.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "# Step 3: Assign ranks to items\n",
    "popularity_rank = {item: rank + 1 for rank, (item, _) in enumerate(sorted_items)}\n",
    "\n",
    "# Print the popularity ranks\n",
    "# for item, rank in popularity_rank.items():\n",
    "#     print(f\"Item {item} has popularity rank {rank}\")\n",
    "sorted_items[:10]\n",
    "#popularity_rank"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "user_item_rating_dict = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in user_item_matrix.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "user_item_rating_tensor = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for user_id, item_rating_dict in user_item_rating_dict.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    item_rating_list = list(item_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    item_rating_tensors = [torch.tensor([[item_id, rating]], dtype=torch.float) for item_id, rating in item_rating_list]\n",
    "    \n",
    "    # Stack the list of tensors along a new dimension to create a single tensor\n",
    "    item_rating_tensor = torch.stack(item_rating_tensors)\n",
    "    \n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    user_item_rating_tensor[user_id] = item_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "user_item_rating_dict1 = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in user_item_matrix_1.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict1[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "user_item_rating_tensor1 = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for user_id, item_rating_dict in user_item_rating_dict1.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    item_rating_list = list(item_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    item_rating_tensors = [torch.tensor([[item_id, rating]], dtype=torch.float) for item_id, rating in item_rating_list]\n",
    "    \n",
    "    # Stack the list of tensors along a new dimension to create a single tensor\n",
    "    item_rating_tensor = torch.stack(item_rating_tensors)\n",
    "    \n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    user_item_rating_tensor1[user_id] = item_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "user_item_rating_dict5 = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for user, items_ratings in user_item_matrix_5.items():\n",
    "    items_dict = {item: rating for item, rating in items_ratings}\n",
    "    user_item_rating_dict5[user] = items_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "user_item_rating_tensor5 = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for user_id, item_rating_dict in user_item_rating_dict5.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    item_rating_list = list(item_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    item_rating_tensors = [torch.tensor([[item_id, rating]], dtype=torch.float) for item_id, rating in item_rating_list]\n",
    "    \n",
    "    # Stack the list of tensors along a new dimension to create a single tensor\n",
    "    item_rating_tensor = torch.stack(item_rating_tensors)\n",
    "    \n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    user_item_rating_tensor5[user_id] = item_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def hellinger_distance(p, q):\n",
    "    return torch.sqrt(torch.sum((torch.sqrt(p) - torch.sqrt(q)) ** 2)) / torch.sqrt(torch.tensor(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_items = len(model.qi)\n",
    "n_users = len(model.pu)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#define user_type.choice\n",
    "#define user_type.rating\n",
    "import random\n",
    "class UserType:\n",
    "    def __init__(self, user_type, rec_scores, popularities, beta=0):\n",
    "        self.user_type = user_type\n",
    "        self.rec_scores = rec_scores\n",
    "        self.popularities = popularities\n",
    "        self.beta = beta\n",
    "        self.set_user_type_values()\n",
    "\n",
    "    def set_user_type_values(self):\n",
    "        if self.user_type == \"Enjoyer\":\n",
    "            self.item_choice = 0\n",
    "            self.item_rating = 5\n",
    "        elif self.user_type == \"Hater\":\n",
    "            self.item_choice = 0\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Random Enjoyer\":\n",
    "            self.item_choice = random.randint(0, len(self.rec_scores) - 1)\n",
    "            self.item_rating = 5\n",
    "        elif self.user_type == \"Random Hater\":\n",
    "            self.item_choice = random.randint(0, len(self.rec_scores) - 1)\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Choice Enjoyer\":\n",
    "            # probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            # probabilities /= probabilities.sum() \n",
    "            # self.item_choice = np.random.choice(len(self.rec_scores), p=probabilities)\n",
    "            # self.item_rating = 5\n",
    "            \n",
    "            probabilities = torch.softmax(torch.mul(self.rec_scores, self.beta), dim=0)\n",
    "\n",
    "            # Choose an item based on probabilities\n",
    "            self.item_choice = torch.multinomial(probabilities, 1).item()\n",
    "\n",
    "            # Set item rating to 5\n",
    "            self.item_rating = torch.tensor(5, dtype=torch.float64)\n",
    "        elif self.user_type == \"Choice Hater\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.rec_scores), p=probabilities)\n",
    "            self.item_rating = 1\n",
    "        elif self.user_type == \"Popular Enjoyer\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.values), p=probabilities)\n",
    "            if self.popularities[self.item_choice]<500:\n",
    "                self.item_rating = 5\n",
    "            else:\n",
    "                self.item_rating = 1\n",
    "        elif self.user_type == \"Niche Enjoyer\":\n",
    "            probabilities = np.exp(self.beta * np.array(self.rec_scores))\n",
    "            probabilities /= probabilities.sum() \n",
    "            self.item_choice = np.random.choice(len(self.values), p=probabilities)\n",
    "            if self.popularities[self.item_choice]<500:\n",
    "                self.item_rating = 1\n",
    "            else:\n",
    "                self.item_rating = 5\n",
    "        else:\n",
    "            raise ValueError(\"Invalid user type. Please choose a valid user type.\")\n",
    "        "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Reachability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from tqdm import tqdm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor_single(user_vector, items, ratings):\n",
    "    Q_list = [model_last_item.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor(user_vector, items, ratings):\n",
    "    Q_list = [model.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_user_tensor_five(user_vector, items, ratings):\n",
    "    Q_list = [model_last_five.qi[item] for item in items]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!export https_proxy=http://proxy.cmu.edu:3128/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!export http_proxy=http://proxy.cmu.edu:3128/"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch.nn.functional as F\n",
    "def get_all_recommendations_stochastic(user_vector, sample_size, beta = 0.8):\n",
    "    num_samples = sample_size\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "        predicted_ratings[item] = item_rating\n",
    "    \n",
    "    # Convert the predicted ratings dictionary to PyTorch tensor\n",
    "    ratings_tensor_1 = torch.tensor(list(predicted_ratings.values()), dtype=torch.float)\n",
    "    \n",
    "    # Compute probabilities proportional to exp(beta*predicted_rating)\n",
    "    probabilities = F.softmax(beta * ratings_tensor_1, dim=0)\n",
    "    \n",
    "    # Sample num_samples items based on the probability distribution\n",
    "    sampled_indices = torch.multinomial(probabilities, num_samples, replacement=False)\n",
    "    \n",
    "    # Convert indices to item names and corresponding predicted scores\n",
    "    sampled_items = [list(predicted_ratings.keys())[idx] for idx in sampled_indices]\n",
    "    # sampled_scores = [list(available_items.values())[idx] for idx in sampled_indices]\n",
    "    \n",
    "    return sampled_items"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_all_recommendation_scores_stochastic(user_vector, sample_size, type_, beta = 0.8):\n",
    "    device = user_vector.device\n",
    "    num_samples = sample_size\n",
    "    if type_ == 'keepall':\n",
    "        n_items =len(model.qi)\n",
    "    if type_ == 'single':\n",
    "        n_items =len(model_last_item.qi)\n",
    "    if type_ == 'five':\n",
    "        n_items =len(model_last_five.qi)\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "    if type_ == 'keepall':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model.qi[item])#.to(device)\n",
    "            predicted_ratings[item] = item_rating\n",
    "    if type_ == 'single':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_item.qi[item])\n",
    "            predicted_ratings[item] = item_rating    \n",
    "    if type_ == 'five':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_five.qi[item])\n",
    "            predicted_ratings[item] = item_rating       \n",
    "    \n",
    "    # Convert the predicted ratings dictionary to PyTorch tensor\n",
    "    ratings_tensor_1 = torch.tensor(list(predicted_ratings.values()), dtype=torch.float)\n",
    "    \n",
    "    # Compute probabilities proportional to exp(beta*predicted_rating)\n",
    "    probabilities = F.softmax(beta * ratings_tensor_1, dim=0)\n",
    "    \n",
    "    # Sample num_samples items based on the probability distribution\n",
    "    sampled_indices = torch.multinomial(probabilities, num_samples, replacement=False)\n",
    "    \n",
    "    # Convert indices to item names and corresponding predicted scores\n",
    "    sampled_items = [list(predicted_ratings.keys())[idx] for idx in sampled_indices]\n",
    "    sampled_scores = [list(predicted_ratings.values())[idx] for idx in sampled_indices]\n",
    "    \n",
    "    return sampled_items, sampled_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_all_recommendation_scores_deterministic(user_vector, sample_size, type_, beta=0.8):\n",
    "    device = user_vector.device\n",
    "    num_samples = sample_size\n",
    "\n",
    "    if type_ == 'keepall':\n",
    "        n_items = len(model.qi)\n",
    "    if type_ == 'single':\n",
    "        n_items = len(model_last_item.qi)\n",
    "    if type_ == 'five':\n",
    "        n_items = len(model_last_five.qi)\n",
    "\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "\n",
    "    if type_ == 'keepall':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model.qi[item])\n",
    "            predicted_ratings[item] = item_rating\n",
    "    if type_ == 'single':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_item.qi[item])\n",
    "            predicted_ratings[item] = item_rating\n",
    "    if type_ == 'five':\n",
    "        for item in range(0, n_items):\n",
    "            item_rating = user_vector @ torch.tensor(model_last_five.qi[item])\n",
    "            predicted_ratings[item] = item_rating\n",
    "\n",
    "    # Find the item with the highest predicted rating\n",
    "    max_item_index = max(predicted_ratings, key=predicted_ratings.get)\n",
    "    max_item_score = predicted_ratings[max_item_index]\n",
    "\n",
    "    return [max_item_index], [max_item_score]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Finalized\n",
    "#What I compare with is the first value\n",
    "\n",
    "def past_user_item_reachability(user_id, item_id, past_time):\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating =  trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating = torch.exp(0.8 * torch.matmul(torch.tensor(model.pu[20]), torch.tensor(model.qi[25])))\n",
    "    total_sum = 0\n",
    "    for item in range(len(model_last_five.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(torch.tensor(model.pu[20]), torch.tensor(model.qi[item])))\n",
    "    print(final_rating/total_sum)   \n",
    "    \n",
    "    final_rating=0\n",
    "    for epoch in range(1, 100):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "        user_vector_initial = torch.tensor(model_last_five.pu[user_id])\n",
    "        user_vector = user_vector_initial\n",
    "        time_max = past_time\n",
    "        already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "        already_rated = already_rated[:-past_time]\n",
    "        ratings_old = rating_tensor[:-past_time]\n",
    "        n = len(ratings_old)\n",
    "        zeros_to_add = torch.zeros(time_max)\n",
    "        ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        for timestep in range(0,time_max):\n",
    "            curr_item = chosen_items[timestep]\n",
    "            ratings[n+timestep] = user_action_clamped[timestep]\n",
    "            already_rated.append(curr_item)\n",
    "            user_vector = update_user_tensor_five(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "        total_sum = 0\n",
    "        for item in range(len(model_last_five.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model_last_five.qi[item])))\n",
    "            #print(final_rating/total_sum)  \n",
    "        item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model_last_five.qi[item_to_be_reached])))/total_sum\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "        #user_action = user_action.clamp(1, 5) \n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.set_printoptions(precision=7)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(past_user_item_reachability(20,25,5))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Finalized, but stochastic so it doesn't work well\n",
    "\n",
    "#too many parameters\n",
    "\n",
    "def future_user_item_reachability(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    # item_and_rating =  trainset.ur[user_id][-future_time:]\n",
    "    chosen_ratings = [5] * future_time * len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating=0\n",
    "    \n",
    "    item_ratings_list = []\n",
    "    \n",
    "    for epoch in tqdm(range(1, 30)):\n",
    "        rating_vals = torch.zeros(100)\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "            ratings_old = rating_tensor\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_stochastic(user_vector, sample_size=1, type_=\"keepall\")\n",
    "                ratings[n+timestep] = user_action_clamped[5*recommendation[0]+timestep]\n",
    "                already_rated.append(recommendation[0])\n",
    "                user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            total_sum = 0\n",
    "            for item in range(len(model.qi)):\n",
    "                total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item])))\n",
    "            rating_vals[int_var] = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))/total_sum\n",
    "            #print(item_rating)\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        item_ratings_list.append(-item_rating.item())\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "    plt.figure(figsize=(10, 6))\n",
    "    plt.plot(item_ratings_list)\n",
    "    plt.xlabel('Epoch')\n",
    "    plt.ylabel('Item Rating')\n",
    "    plt.title('Item Rating vs. Epoch')\n",
    "    plt.show()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Finalized, works well, only slowly\n",
    "\n",
    "#too many parameters\n",
    "#deterministic\n",
    "\n",
    "def future_user_item_reachability(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    # item_and_rating =  trainset.ur[user_id][-future_time:]\n",
    "    chosen_ratings = [5] * future_time * len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=1)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating=0\n",
    "    \n",
    "    rating_vals_ = torch.zeros(10)\n",
    "    for upper_var in range(1,10):\n",
    "        user_vector_ = torch.tensor(model.pu[user_id])\n",
    "        already_rated_ = list(user_item_rating_dict[user_id].keys())\n",
    "        ratings_old_ = torch.tensor(list(ratings_dict.values()))\n",
    "        n = len(ratings_old_)\n",
    "        zeros_to_add = torch.zeros(future_time)\n",
    "        ratings_ = torch.cat((ratings_old_, zeros_to_add), dim=0)\n",
    "        for timestep in range(0,future_time):\n",
    "            recommendation, recommendation_score = get_all_recommendation_scores_deterministic(user_vector_, sample_size=1, type_=\"keepall\")\n",
    "            ratings_[n+timestep] = user_vector_ @ torch.tensor(model.qi[recommendation[0]])\n",
    "            already_rated_.append(recommendation[0])\n",
    "            user_vector_ = update_user_tensor(user_vector_, already_rated_, ratings_[:n+timestep+1])\n",
    "        total_sum = 0\n",
    "        for item in range(len(model.qi)):\n",
    "            total_sum += torch.exp(0.8 * torch.matmul(user_vector_, torch.tensor(model.qi[item])))\n",
    "        rating_vals_[upper_var] = -torch.exp(0.8*torch.matmul(user_vector_, torch.tensor(model.qi[item_to_be_reached])))/total_sum\n",
    "    init_val = torch.mean(rating_vals_)\n",
    "    #print(init_val)\n",
    "    \n",
    "    for epoch in tqdm(range(1, 10)):\n",
    "        rating_vals = torch.zeros(10)\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "            ratings_old = rating_tensor\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_deterministic(user_vector, sample_size=1, type_=\"keepall\")\n",
    "                ratings[n+timestep] = user_action_clamped[5*recommendation[0]+timestep]\n",
    "                already_rated.append(recommendation[0])\n",
    "                user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            total_sum = 0\n",
    "            for item in range(len(model.qi)):\n",
    "                total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item])))\n",
    "            rating_vals[int_var] = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))/total_sum\n",
    "            #print(item_rating)\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = item_rating.item()/init_val.item()\n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# #Finalized, works well, only slowly\n",
    "\n",
    "# #too many parameters\n",
    "# #deterministic\n",
    "\n",
    "# def future_user_item_reachability(user_id, item_id, future_time):\n",
    "#     item_to_be_reached = item_id\n",
    "#     # item_and_rating =  trainset.ur[user_id][-future_time:]\n",
    "#     chosen_ratings = [5] * future_time * len(model.qi)\n",
    "#     user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "#     optimizer = torch.optim.Adam([user_action], lr=1)\n",
    "#     # reach_probabilities = []\n",
    "#     ratings_dict1 = user_item_rating_dict[user_id]\n",
    "#     for j in user_item_rating_dict[user_id]:\n",
    "#         ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "#     ratings_dict = ratings_dict1\n",
    "#     final_rating=0\n",
    "    \n",
    "#     rating_vals_ = torch.zeros(10)\n",
    "#     for upper_var in range(0,10):\n",
    "#         user_vector_ = torch.tensor(model.pu[user_id])\n",
    "#         already_rated_ = list(user_item_rating_dict[user_id].keys())\n",
    "#         ratings_old_ = torch.tensor(list(ratings_dict.values()))\n",
    "#         n = len(ratings_old_)\n",
    "#         zeros_to_add = torch.zeros(future_time)\n",
    "#         ratings_ = torch.cat((ratings_old_, zeros_to_add), dim=0)\n",
    "#         for timestep in range(0,future_time):\n",
    "#             recommendation, recommendation_score = get_all_recommendation_scores_deterministic(user_vector_, sample_size=1, type_=\"keepall\")\n",
    "#             ratings_[n+timestep] = user_vector_ @ torch.tensor(model.qi[recommendation[0]])\n",
    "#             already_rated_.append(recommendation[0])\n",
    "#             user_vector_ = update_user_tensor(user_vector_, already_rated_, ratings_[:n+timestep+1])\n",
    "#         total_sum = 0\n",
    "#         for item in range(len(model.qi)):\n",
    "#             total_sum += torch.exp(0.8 * torch.matmul(user_vector_, torch.tensor(model.qi[item])))\n",
    "#         rating_vals_[upper_var] = -torch.exp(0.8*torch.matmul(user_vector_, torch.tensor(model.qi[item_to_be_reached])))/total_sum\n",
    "#     init_val = torch.mean(rating_vals_)\n",
    "#     print(init_val)\n",
    "    \n",
    "#     item_ratings_list = []\n",
    "    \n",
    "#     for epoch in tqdm(range(1, 8)):\n",
    "#         rating_vals = torch.zeros(10)\n",
    "#         for int_var in range(0,len(rating_vals)):\n",
    "#             user_action_clamped = user_action.clamp(1, 5)\n",
    "#             rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "#             user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "#             user_vector = user_vector_initial\n",
    "#             time_max = future_time\n",
    "#             already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "#             ratings_old = rating_tensor\n",
    "#             n = len(ratings_old)\n",
    "#             zeros_to_add = torch.zeros(time_max)\n",
    "#             ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "#             for timestep in range(0,time_max):\n",
    "#                 recommendation, recommendation_score = get_all_recommendation_scores_deterministic(user_vector, sample_size=1, type_=\"keepall\")\n",
    "#                 ratings[n+timestep] = user_action_clamped[5*recommendation[0]+timestep]\n",
    "#                 already_rated.append(recommendation[0])\n",
    "#                 user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "#             total_sum = 0\n",
    "#             for item in range(len(model.qi)):\n",
    "#                 total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item])))\n",
    "#             rating_vals[int_var] = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))/total_sum\n",
    "#             #print(item_rating)\n",
    "#         item_rating = sum(rating_vals)/len(rating_vals)\n",
    "#         item_ratings_list.append(-item_rating.item())\n",
    "#         item_rating.backward()\n",
    "#         optimizer.step()\n",
    "#         # print(user_action)\n",
    "#         optimizer.zero_grad()\n",
    "#     plt.figure(figsize=(10, 6))\n",
    "#     plt.plot(item_ratings_list)\n",
    "#     plt.xlabel('Epoch')\n",
    "#     plt.ylabel('Item Rating')\n",
    "#     plt.title('Item Rating vs. Epoch')\n",
    "#     plt.show()\n",
    "\n",
    "#     final_rating = item_rating.item()/init_val.item()\n",
    "#     return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# #gpu\n",
    "# import torch\n",
    "# from tqdm import tqdm\n",
    "# import matplotlib.pyplot as plt\n",
    "\n",
    "# def future_user_item_reachability(user_id, item_id, future_time):\n",
    "#     device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "\n",
    "#     item_to_be_reached = item_id\n",
    "#     chosen_ratings = [5] * future_time * len(model.qi)\n",
    "#     user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "#     optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "\n",
    "#     ratings_dict1 = user_item_rating_dict[user_id]\n",
    "#     for j in user_item_rating_dict[user_id]:\n",
    "#         ratings_dict1[j] = torch.tensor(ratings_dict1[j], dtype=torch.float64).to(device)\n",
    "#     ratings_dict = ratings_dict1\n",
    "\n",
    "#     final_rating = 0\n",
    "#     item_ratings_list = []\n",
    "\n",
    "#     for epoch in tqdm(range(1, 100)):\n",
    "        \n",
    "#         user_action_clamped = user_action.clamp(1, 5)\n",
    "#         rating_tensor = torch.tensor(list(ratings_dict.values())).to(device)\n",
    "#         user_vector_initial = torch.tensor(model.pu[user_id]).to(device)\n",
    "#         user_vector = user_vector_initial\n",
    "\n",
    "#         time_max = future_time\n",
    "#         already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "#         ratings_old = rating_tensor\n",
    "#         n = len(ratings_old)\n",
    "#         zeros_to_add = torch.zeros(time_max).to(device)\n",
    "#         ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "\n",
    "#         for timestep in range(0, time_max):\n",
    "#             recommendation, recommendation_score = get_all_recommendation_scores_stochastic(user_vector, sample_size=1, type_=\"keepall\")\n",
    "#             ratings[n+timestep] = user_action_clamped[5*recommendation[0]+timestep]\n",
    "#             already_rated.append(recommendation[0])\n",
    "#             user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "\n",
    "#         total_sum = 0\n",
    "#         for item in range(len(model.qi)):\n",
    "#             total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item]).to(device)))\n",
    "\n",
    "#         item_rating = -torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached]).to(device))) / total_sum\n",
    "#         print(item_rating)\n",
    "#         item_ratings_list.append(-item_rating.item())\n",
    "\n",
    "#         item_rating.backward()\n",
    "#         optimizer.step()\n",
    "#         optimizer.zero_grad()\n",
    "\n",
    "#     plt.figure(figsize=(10, 6))\n",
    "#     plt.plot(item_ratings_list)\n",
    "#     plt.xlabel('Epoch')\n",
    "#     plt.ylabel('Item Rating')\n",
    "#     plt.title('Item Rating vs. Epoch')\n",
    "#     plt.show()\n",
    "\n",
    "#     final_rating = -item_rating.item()\n",
    "#     return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#modified version with more samples for more stable gradient\n",
    "\n",
    "def future_user_item_reachability(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating =  trainset.ur[user_id][-future_time:]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    \n",
    "    final_rating=0\n",
    "    min_item_rating = 0\n",
    "    best_user = torch.tensor(model.pu[user_id])\n",
    "    for epoch in range(1, 50):\n",
    "        rating_vals =torch.zeros(100)\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "            ratings_old = rating_tensor\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_stochastic(user_vector, sample_size=1, type_=\"keepall\")\n",
    "                ratings[n+timestep] = user_action_clamped[timestep]\n",
    "                already_rated.append(recommendation[0])\n",
    "                user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            rating_vals[int_var] = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        print(item_rating)\n",
    "        #save the one with the best value? then check later\n",
    "        if item_rating < min_item_rating:\n",
    "            min_item_rating = item_rating.detach()\n",
    "            best_user = user_vector.detach()\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(model.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(best_user, torch.tensor(model.qi[item])))\n",
    "    return final_rating/total_sum    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def update_user_tensor(user_vector, items, ratings):\n",
    "#     device = user_vector.device  # Get the device of user_vector\n",
    "#     Q_list = [model.qi[item] for item in items]\n",
    "#     Q = torch.tensor(Q_list, dtype=torch.float64).to(device)  # Move Q to the same device as user_vector\n",
    "#     ratings = ratings.to(device)  # Move ratings to the same device as user_vector\n",
    "#     p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "#     return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.set_device(7)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_user_item_reachability(221,3418,5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Again, I will be comparing to initial value"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "33 minutes for 3000 runs essentially"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#0.000269"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#probability that item is recommended to me at t0+1, without me doing anything"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#0.0001885"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#future with fixed rating for each item instead of fixed rating for each time\n",
    "def future_user_item_reachability_2(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    chosen_ratings = [5.0]*len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating=0\n",
    "    for epoch in range(1, 500):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "        user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "        user_vector = user_vector_initial\n",
    "        time_max = future_time\n",
    "        already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "        ratings_old = rating_tensor\n",
    "        n = len(ratings_old)\n",
    "        zeros_to_add = torch.zeros(time_max)\n",
    "        ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        for timestep in range(0,time_max):\n",
    "            recommendation, recommendation_score = get_all_recommendation_scores_stochastic(user_vector, sample_size=1)\n",
    "            ratings[n+timestep] = user_action_clamped[recommendation]\n",
    "            already_rated.append(recommendation[0])\n",
    "            user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "        item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(model.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item])))\n",
    "    return final_rating/total_sum    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#modified version with more samples for more stable gradient\n",
    "\n",
    "#future with fixed rating for each item instead of fixed rating for each time\n",
    "def future_user_item_reachability_2(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    chosen_ratings = [5.0]*len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating=0\n",
    "    for epoch in range(1, 50):\n",
    "        rating_vals = torch.zeros(100)\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "            user_vector_initial = torch.tensor(model.pu[user_id])\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "            ratings_old = rating_tensor\n",
    "            n = len(ratings_old)\n",
    "            zeros_to_add = torch.zeros(time_max)\n",
    "            ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_stochastic(user_vector, sample_size=1)\n",
    "                ratings[n+timestep] = user_action_clamped[recommendation]\n",
    "                already_rated.append(recommendation[0])\n",
    "                user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            rating_vals[int_var] =  -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(model.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model.qi[item])))\n",
    "    return final_rating/total_sum    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_user_item_reachability(20,25,5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Stability time"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#PAST STABILITY\n",
    "#CHOOSE 10 RANDOM USERS AS ADVERSARIES\n",
    "#NOW LETS LOOK AT THE PAST-1-STABILITY OF INFLUENTIAL AND MID USERS TO THEIR ACTIONS\n",
    "#PARAMETER SPACE WILL BE 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 3703 items\n",
    "# 5 items\n",
    "# 3698\n",
    "#\n",
    "\n",
    "def get_all_preferences(user_vector_1, item_vector_copy_h):\n",
    "    # Compute ratings for each item by dot product with user_vector\n",
    "    temp_vector = user_vector_1.detach().clone()\n",
    "    item_ratings = torch.matmul(item_vector_copy_h, temp_vector.unsqueeze(1))\n",
    "    return item_ratings.squeeze(1) \n",
    "\n",
    "# def get_all_preferences(user_vector, item_vector_copy_h, already_rated):\n",
    "#     item_ratings = torch.matmul(item_vector_copy_h, user_vector.unsqueeze(1)).squeeze(1)\n",
    "#     sorted_indices = torch.argsort(item_ratings, descending=True)\n",
    "    \n",
    "#     # # Create a mask indicating whether each item is already rated\n",
    "#     # mask = torch.zeros_like(item_ratings, dtype=torch.bool)\n",
    "#     # mask[already_rated] = True\n",
    "    \n",
    "#     # # Filter out the indices of items that are not already rated\n",
    "#     # unrated_indices = sorted_indices[~mask]\n",
    "    \n",
    "#     return sorted_indices\n",
    "\n",
    "# def get_all_preferences(user_vector, item_vector_copy, already_rated):\n",
    "#     predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "#     for item in range(0, n_items):\n",
    "#         item_rating = user_vector @ torch.tensor(item_vector_copy[item])\n",
    "#         predicted_ratings[item] = item_rating\n",
    "#     sorted_pred_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "#     count_var = 0\n",
    "#     unrated_item_names=[]\n",
    "#     for i in sorted_pred_ratings:\n",
    "#         item_id = i[0]\n",
    "#         if item_id not in already_rated:\n",
    "#             count_var+=1\n",
    "#             unrated_item_names.append(item_id)\n",
    "#     return torch.tensor(unrated_item_names)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_item_tensor_one(item_vector, users, ratings):\n",
    "    Q_list = [model_last_item.pu[user] for user in users]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_item_tensor_five(item_vector, users, ratings):\n",
    "    Q_list = [model_last_five.pu[user] for user in users]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def update_item_tensor(item_vector, users, ratings):\n",
    "    Q_list = [model.pu[user] for user in users]\n",
    "    Q = torch.tensor(Q_list, dtype=torch.float64)\n",
    "    # p = np.linalg.inv(Q.T @ Q) @ Q.T @ ratings\n",
    "    p = torch.inverse(Q.t() @ Q) @ Q.t() @ ratings\n",
    "    return p"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mse = torch.nn.MSELoss()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_user_matrix = trainset.ir\n",
    "item_user_matrix1 = trainset1.ir\n",
    "item_user_matrix5 = trainset5.ir"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "item_user_rating_dict = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for item, users_ratings in item_user_matrix.items():\n",
    "    users_dict = {user: rating for user, rating in users_ratings}\n",
    "    item_user_rating_dict[item] = users_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "item_user_rating_tensor = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for item_id, user_rating_dict in item_user_rating_dict.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    user_rating_list = list(user_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    user_rating_tensors = [torch.tensor([[user_id, rating]], dtype=torch.float) for user_id, rating in user_rating_list]\n",
    "    user_rating_tensor = torch.stack(user_rating_tensors)\n",
    "\n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    item_user_rating_tensor[item_id] = user_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "item_user_rating_dict1 = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for item, users_ratings in item_user_matrix1.items():\n",
    "    users_dict = {user: rating for user, rating in users_ratings}\n",
    "    item_user_rating_dict1[item] = users_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "item_user_rating_tensor1 = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for item_id, user_rating_dict in item_user_rating_dict1.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    user_rating_list = list(user_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    user_rating_tensors = [torch.tensor([[user_id, rating]], dtype=torch.float) for user_id, rating in user_rating_list]\n",
    "    user_rating_tensor = torch.stack(user_rating_tensors)\n",
    "    \n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    item_user_rating_tensor1[item_id] = user_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Convert to a dictionary of dictionaries\n",
    "item_user_rating_dict5 = defaultdict(dict)\n",
    "\n",
    "# Populate the user_item_rating_dict\n",
    "for item, users_ratings in item_user_matrix5.items():\n",
    "    users_dict = {user: rating for user, rating in users_ratings}\n",
    "    item_user_rating_dict5[item] = users_dict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "item_user_rating_tensor5 = {}\n",
    "\n",
    "# Iterate over each user_id and their item-rating dictionary\n",
    "for item_id, user_rating_dict in item_user_rating_dict5.items():\n",
    "    # Convert the item-rating dictionary to a list of tuples\n",
    "    user_rating_list = list(user_rating_dict.items())\n",
    "    \n",
    "    # Convert the list of tuples to a tensor\n",
    "    user_rating_tensors = [torch.tensor([[user_id, rating]], dtype=torch.float) for user_id, rating in user_rating_list]\n",
    "    user_rating_tensor = torch.stack(user_rating_tensors)\n",
    "    \n",
    "    # Store the item-rating tensor in the converted dictionary with the user_id as the key\n",
    "    item_user_rating_tensor5[item_id] = user_rating_tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay so for a single user, lets look at a single adversarial user and see the impact on stability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#I will see the last k ratings for the adversarial user"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch.nn.functional as F"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_k_stability(adversary, curr_user, k):\n",
    "    file_path = 'surprise_model_last_five.dump'\n",
    "    _, model_last_five = dump.load(file_path)\n",
    "    \n",
    "    item_and_rating = trainset.ur[adversary][-k:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [3., 3., 2., 5., 2.]#[i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.4)\n",
    "    \n",
    "    item_vector_copy = torch.tensor(model_last_five.qi)  # change as per k\n",
    "    user_vector = torch.tensor(model_last_five.pu[curr_user])\n",
    "    \n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "    initial_rec_list_softmax = F.softmax(initial_rec_list, dim=0)\n",
    "    #print(initial_rec_list_softmax)\n",
    "    #print(initial_rec_list)\n",
    "    \n",
    "    n_epochs = 20\n",
    "    distance_metric = None\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        item_vector_copy_tensor = torch.tensor(model_last_five.qi)  # change as per k\n",
    "        \n",
    "        for loop_var in range(0, k):\n",
    "            curr_item = chosen_items[loop_var]\n",
    "            user_list = [item_user_matrix5[curr_item][i][0] for i in range(len(item_user_matrix5[curr_item]))]  # change as per k\n",
    "            rating_list = torch.tensor([item_user_matrix5[curr_item][i][1] for i in range(len(item_user_matrix5[curr_item]))], dtype=torch.float64)  # change as per k\n",
    "            user_list.append(adversary)\n",
    "            rating_list = torch.cat((rating_list, user_action_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "            item_vector_copy_tensor[curr_item] = update_item_tensor_five(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "        \n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "        final_rec_list_softmax = F.softmax(final_rec_list, dim=0)\n",
    "        #print(max(final_rec_list))\n",
    "        print(sum(final_rec_list_softmax))\n",
    "        distance_metric = -hellinger_distance(final_rec_list_softmax, initial_rec_list_softmax)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        print(user_action)\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    \n",
    "    return distance_metric.item()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.rcParams.update({'font.size': 14, 'axes.labelsize': 16, 'xtick.labelsize': 14, 'ytick.labelsize': 12, 'legend.fontsize': 14, 'axes.titlesize': 18})\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#20,25,5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "past_k_stability(201, 2568, 5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def future_k_stability(adversary, curr_user, k):\n",
    "#     file_path = 'surprise_model_full.dump'\n",
    "#     # Load the saved model\n",
    "#     _, model = dump.load(file_path)\n",
    "#     adversary_vector = torch.tensor(model.pu[adversary])\n",
    "#     already_rated = list(user_item_rating_dict[adversary].keys()) \n",
    "#     chosen_ratings = [5.0]*k\n",
    "#     user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "#     optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "#     item_vector_copy = torch.tensor(model.qi)\n",
    "#     user_vector = torch.tensor(model.pu[curr_user])\n",
    "#     initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "#     n_epochs = 50\n",
    "#     distance_metric = None\n",
    "#     for epoch in tqdm(range(0, n_epochs)):\n",
    "#         distance_vals = torch.zeros(100)\n",
    "#         for ave_var in range(0,len(distance_vals)):\n",
    "#             _, model = dump.load(file_path)\n",
    "#             already_rated = list(user_item_rating_dict[adversary].keys())\n",
    "#             user_action_clamped = user_action.clamp(1, 5)\n",
    "#             item_vector_copy_tensor = torch.tensor(model.qi)\n",
    "#             for loop_var in range(0,k):\n",
    "#                 curr_item, recommendation_score = get_all_recommendation_scores_stochastic(adversary_vector, sample_size=1, type_=\"keepall\")\n",
    "#                 curr_item = curr_item[0]\n",
    "#                 already_rated.append(curr_item)\n",
    "#                 user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "#                 rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "#                 if adversary not in user_list:\n",
    "#                     user_list.append(adversary)\n",
    "#                     rating_list = torch.cat((rating_list, user_action_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "#                 else:\n",
    "#                     ind = user_list.index(adversary)\n",
    "#                     rating_list[ind] = user_action_clamped[loop_var]\n",
    "#                 item_vector_copy_tensor[curr_item] = update_item_tensor(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "#             final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "#             distance_vals[ave_var] = -mse(final_rec_list,initial_rec_list)\n",
    "#             # print(distance_vals[ave_var])\n",
    "#         distance_metric = sum(distance_vals)/len(distance_vals)\n",
    "#         print(distance_metric)\n",
    "        \n",
    "#         distance_metric.backward()\n",
    "#         optimizer.step()\n",
    "#         optimizer.zero_grad()\n",
    "#     return distance_metric.item()\n",
    "            \n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#deterministic\n",
    "\n",
    "\n",
    "def future_k_stability(adversary, curr_user, k):\n",
    "    file_path = 'surprise_model_full.dump'\n",
    "#     # Load the saved model\n",
    "    _, model = dump.load(file_path)\n",
    "    adversary_vector = torch.tensor(model.pu[adversary])\n",
    "    already_rated = list(user_item_rating_dict[adversary].keys()) \n",
    "    chosen_ratings = [2.0]*k*len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.8)\n",
    "    item_vector_copy = torch.tensor(model.qi)\n",
    "    user_vector = torch.tensor(model.pu[curr_user])\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "    initial_rec_list_softmax = F.softmax(initial_rec_list, dim=0)\n",
    "    n_epochs = 15\n",
    "    distance_metric = None\n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        rating_vals = torch.zeros(10)\n",
    "        for outer_var in range(0,len(rating_vals)):\n",
    "            already_rated = list(user_item_rating_dict[adversary].keys())\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            item_vector_copy_tensor = torch.tensor(model.qi)\n",
    "            for loop_var in range(0,k):\n",
    "                curr_item, recommendation_score = get_all_recommendation_scores_deterministic(adversary_vector, sample_size=1, type_=\"keepall\")\n",
    "                curr_item = curr_item[0]\n",
    "                already_rated.append(curr_item)\n",
    "                user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "                rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "                if adversary not in user_list:\n",
    "                    user_list.append(adversary)\n",
    "                    rating_list = torch.cat((rating_list, user_action_clamped[5*curr_item+loop_var].unsqueeze(0)), dim=0)\n",
    "                else:\n",
    "                    ind = user_list.index(adversary)\n",
    "                    rating_list[ind] = user_action_clamped[5*curr_item+loop_var]\n",
    "                item_vector_copy_tensor[curr_item] = update_item_tensor(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "            final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "            final_rec_list_softmax = F.softmax(final_rec_list, dim=0)\n",
    "            rating_vals[outer_var] = -hellinger_distance(final_rec_list_softmax,initial_rec_list_softmax)\n",
    "        distance_metric = sum(rating_vals)/len(rating_vals)\n",
    "        print(rating_vals)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    return distance_metric.item()\n",
    "            "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def future_k_stability(adversary, curr_user, k):\n",
    "    file_path = 'surprise_model_full.dump'\n",
    "#     # Load the saved model\n",
    "    _, model = dump.load(file_path)\n",
    "    adversary_vector = torch.tensor(model.pu[adversary])\n",
    "    already_rated = list(user_item_rating_dict[adversary].keys()) \n",
    "    chosen_ratings = [5.0]*k\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    item_vector_copy = torch.tensor(model.qi)\n",
    "    user_vector = torch.tensor(model.pu[curr_user])\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "    n_epochs = 500\n",
    "    distance_metric = None\n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        already_rated = list(user_item_rating_dict[adversary].keys())\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        item_vector_copy_tensor = torch.tensor(model.qi)\n",
    "        for loop_var in range(0,k):\n",
    "            curr_item, recommendation_score = get_all_recommendation_scores_stochastic(adversary_vector, sample_size=1, type_=\"keepall\")\n",
    "            curr_item = curr_item[0]\n",
    "            already_rated.append(curr_item)\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "            if adversary not in user_list:\n",
    "                user_list.append(adversary)\n",
    "                rating_list = torch.cat((rating_list, user_action_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "            else:\n",
    "                ind = user_list.index(adversary)\n",
    "                rating_list[ind] = user_action_clamped[loop_var]\n",
    "            item_vector_copy_tensor[curr_item] = update_item_tensor(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "        distance_metric = -mse(final_rec_list,initial_rec_list)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    return distance_metric.item()\n",
    "            "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_k_stability(20, 5, 5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def future_k_stability_2(adversary, curr_user, k):\n",
    "    file_path = 'surprise_model_full.dump'\n",
    "#     # Load the saved model\n",
    "    _, model = dump.load(file_path)\n",
    "    adversary_vector = torch.tensor(model.pu[adversary])\n",
    "    already_rated = list(user_item_rating_dict[adversary].keys()) \n",
    "    chosen_ratings = [5.0]*len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    item_vector_copy = torch.tensor(model.qi)\n",
    "    user_vector = torch.tensor(model.pu[curr_user])\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "    n_epochs = 500\n",
    "    distance_metric = None\n",
    "    already_rated = list(user_item_rating_dict[adversary].keys())\n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        item_vector_copy_tensor = torch.tensor(model.qi)\n",
    "        for loop_var in range(0,k):\n",
    "            curr_item, recommendation_score = get_all_recommendation_scores_stochastic(adversary_vector, sample_size=1, type_=\"keepall\")\n",
    "            curr_item = curr_item[0]\n",
    "            already_rated.append(curr_item)\n",
    "            user_list = [item_user_matrix[curr_item][i][0] for i in range(len(item_user_matrix[curr_item]))]\n",
    "            rating_list = torch.tensor([item_user_matrix[curr_item][i][1] for i in range(len(item_user_matrix[curr_item]))], dtype = torch.float64)\n",
    "            if adversary not in user_list:\n",
    "                user_list.append(adversary)\n",
    "                rating_list = torch.cat((rating_list, user_action_clamped[curr_item].unsqueeze(0)), dim=0)\n",
    "            else:\n",
    "                ind = user_list.index(adversary)\n",
    "                rating_list[ind] = user_action_clamped[curr_item]\n",
    "            item_vector_copy_tensor[curr_item] = update_item_tensor(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "        distance_metric = -mse(final_rec_list,initial_rec_list)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    return distance_metric.item()\n",
    "            \n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_k_stability_2(20, 25, 5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "MeZO"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def perturb_parameters(theta,epsilon,s):\n",
    "    torch.manual_seed(s)\n",
    "    z_temp = torch.randn(1)\n",
    "    theta_next = theta + epsilon*z_temp\n",
    "    return theta_next\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# theta = torch.tensor(0.)\n",
    "# theta1 = perturb_parameters(theta, 0.1, 0)\n",
    "# theta2 = perturb_parameters(theta, -0.1, 0)\n",
    "# print(theta)\n",
    "# print(theta1)\n",
    "# print(theta2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# #Deterministic choice\n",
    "# # import wandb\n",
    "\n",
    "# # wandb.init(project=\"reachability-single-deterministic\", name=\"run_1_lr_0.08\")\n",
    "# sample_size=1\n",
    "# user_action = torch.tensor(chosen_rating, dtype=torch.float64)\n",
    "# lr = 0.08\n",
    "# item_to_be_reached = 971\n",
    "# min_score = float('inf')\n",
    "# for epoch in range(1, 50):\n",
    "#     user_action_clamped = user_action.clamp(1, 5) \n",
    "#     user_action_post = perturb_parameters(user_action, 0.1, 0)\n",
    "#     user_action_pre = perturb_parameters(user_action, -0.1, 0)\n",
    "#     user_action_post_clamped = user_action_post.clamp(1,5)\n",
    "#     user_action_pre_clamped = user_action_pre.clamp(1,5)\n",
    "#     rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "#     user_vector_initial = torch.tensor(model.pu[5])\n",
    "#     user_vector = user_vector_initial\n",
    "#     time_max = 0\n",
    "#     already_rated = list(user_item_rating_dict[5].keys())\n",
    "#     #already_rated = already_rated[:-1]\n",
    "#     ratings_old = rating_tensor#user_item_rating_dict[5]\n",
    "#     ratings_old_pre = rating_tensor.detach().clone()\n",
    "#     ratings_old_post = rating_tensor.detach().clone()\n",
    "#     ratings_old_pre[-1] = user_action_pre_clamped\n",
    "#     ratings_old_post[-1] = user_action_post_clamped\n",
    "#     # del ratings[chosen_item]\n",
    "#     ratings_old[-1] = user_action_clamped#ratings[chosen_item] = user_action\n",
    "#     torch.manual_seed(0)\n",
    "#     z = torch.randn(1)\n",
    "#     # ratings_old_temp = torch.cat((ratings_old[:-1], user_action), dim=0)\n",
    "#     n = len(ratings_old)\n",
    "#     zeros_to_add = torch.zeros(time_max)\n",
    "#     ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "#     ratings_pre = torch.cat((ratings_old_pre, zeros_to_add), dim=0)\n",
    "#     ratings_post = torch.cat((ratings_old_post, zeros_to_add), dim=0)\n",
    "#     #already_rated.append(chosen_item)\n",
    "#     user_vector = update_user_tensor(user_vector, already_rated, ratings[:n])\n",
    "#     user_vector_pre = update_user_tensor(user_vector, already_rated, ratings_pre[:n])\n",
    "#     user_vector_post = update_user_tensor(user_vector, already_rated, ratings_post[:n])\n",
    "#     for timestep in range(1, time_max+1):\n",
    "#         recommendations, recommendation_scores = get_recommendation_scores_stochastic(user_vector, already_rated, sample_size)\n",
    "#         # usr_type = UserType(\"Choice Enjoyer\", recommendation_scores, [], beta=0.8)\n",
    "#         choice_of_item = recommendations[0]\n",
    "#         ratings[n+timestep-1] = 5\n",
    "#         already_rated.append(choice_of_item)\n",
    "#         user_vector = update_user_tensor(user_vector, already_rated, ratings[:n+timestep])\n",
    "#     item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model.qi[item_to_be_reached])))\n",
    "#     item_rating_pre = -torch.exp(0.8*torch.matmul(user_vector_pre, torch.tensor(model.qi[item_to_be_reached])))\n",
    "#     item_rating_post = -torch.exp(0.8*torch.matmul(user_vector_post, torch.tensor(model.qi[item_to_be_reached])))\n",
    "#     projected_grad = (item_rating_post-item_rating_pre)/(2*0.1)\n",
    "#     torch.manual_seed(0)\n",
    "#     user_action = user_action - lr*torch.randn(1)*projected_grad\n",
    "#     print(abs(item_rating))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# t1_set = trainset"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Last Five"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# #5 is the user we are looking at\n",
    "# item_and_rating =  trainset.ur[5][-5:]\n",
    "# chosen_items = [i[0] for i in item_and_rating]\n",
    "# chosen_ratings = [i[1] for i in item_and_rating]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# def perturb_parameters(theta,epsilon,s):\n",
    "#     torch.manual_seed(s)\n",
    "#     theta_new = theta.detach().clone()\n",
    "#     for i in range(0,len(theta)):\n",
    "#         z_temp = torch.randn(1)\n",
    "#         theta_new[i] = theta_new[i] + epsilon*z_temp\n",
    "#     return theta_new\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def perturb_parameters(theta,epsilon,s, z_temp):\n",
    "    torch.manual_seed(s)\n",
    "    theta_new = theta.detach().clone()\n",
    "    for i in range(0,len(theta)):\n",
    "        #z_temp = torch.randn(1)\n",
    "        theta_new[i] = theta_new[i] + epsilon*z_temp\n",
    "    return theta_new\n",
    "        "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def mezo_past_user_item_reachability(user_id, item_id, past_time):\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating =  trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64)\n",
    "    # reach_probabilities = []\n",
    "    ratings_dict1 = user_item_rating_dict[user_id]\n",
    "    for j in user_item_rating_dict[user_id]:\n",
    "        ratings_dict1[j]=torch.tensor(ratings_dict1[j], dtype=torch.float64)\n",
    "    ratings_dict = ratings_dict1\n",
    "    final_rating=0\n",
    "    for epoch in range(1, 10):\n",
    "        #print(user_action)\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        ####\n",
    "        z_temp = torch.randn(1)\n",
    "        user_action_post = perturb_parameters(user_action, 1, 0, z_temp)\n",
    "        user_action_pre = perturb_parameters(user_action, -1, 0, z_temp)\n",
    "        user_action_post_clamped = user_action_post.clamp(1,5)\n",
    "        user_action_pre_clamped = user_action_pre.clamp(1,5)\n",
    "        ####\n",
    "        rating_tensor = torch.tensor(list(ratings_dict.values()))\n",
    "        user_vector_initial = torch.tensor(model_last_five.pu[user_id])\n",
    "        user_vector = user_vector_initial\n",
    "        user_vector_pre = user_vector.detach().clone()\n",
    "        user_vector_post = user_vector.detach().clone()\n",
    "        time_max = past_time\n",
    "        already_rated = list(user_item_rating_dict[user_id].keys())\n",
    "        already_rated = already_rated[:-past_time]\n",
    "        ratings_old = rating_tensor[:-past_time]\n",
    "        n = len(ratings_old)\n",
    "        zeros_to_add = torch.zeros(time_max)\n",
    "        ratings = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        ####\n",
    "        ratings_pre = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        ratings_post = torch.cat((ratings_old, zeros_to_add), dim=0)\n",
    "        ####\n",
    "        for timestep in range(0,time_max):\n",
    "            curr_item = chosen_items[timestep]\n",
    "            ratings[n+timestep] = user_action_clamped[timestep]\n",
    "            ####\n",
    "            ratings_pre[n+timestep] = user_action_pre_clamped[timestep]\n",
    "            ratings_post[n+timestep] = user_action_post_clamped[timestep]\n",
    "            ####\n",
    "            already_rated.append(curr_item)\n",
    "            user_vector = update_user_tensor_five(user_vector, already_rated, ratings[:n+timestep+1])\n",
    "            ####\n",
    "            user_vector_pre = update_user_tensor_five(user_vector, already_rated, ratings_pre[:n+timestep+1])\n",
    "            user_vector_post = update_user_tensor_five(user_vector, already_rated, ratings_post[:n+timestep+1])\n",
    "            # print(user_vector_pre)\n",
    "            # print(user_vector_post)\n",
    "            ####\n",
    "        item_rating = -torch.exp(0.8*torch.matmul(user_vector, torch.tensor(model_last_five.qi[item_to_be_reached])))\n",
    "        ####\n",
    "        total_sum_pre = 0\n",
    "        for item in range(len(model_last_five.qi)):\n",
    "            total_sum_pre += torch.exp(0.8 * torch.matmul(user_vector_pre, torch.tensor(model_last_five.qi[item])))\n",
    "        total_sum_post = 0\n",
    "        for item in range(len(model_last_five.qi)):\n",
    "            total_sum_post += torch.exp(0.8 * torch.matmul(user_vector_post, torch.tensor(model_last_five.qi[item])))\n",
    "        item_rating_pre = -torch.exp(0.8*torch.matmul(user_vector_pre, torch.tensor(model_last_five.qi[item_to_be_reached])))/total_sum_pre\n",
    "        item_rating_post = -torch.exp(0.8*torch.matmul(user_vector_post, torch.tensor(model_last_five.qi[item_to_be_reached])))/total_sum_post\n",
    "        proj_grad = (item_rating_post - item_rating_pre)/(2*1)\n",
    "        # torch.manual_seed(0)\n",
    "        print(item_rating)\n",
    "        # print(proj_grad)\n",
    "        # print(user_action)\n",
    "        #user_action = user_action.clamp(1, 5) \n",
    "        for i in range(0,len(user_action)):\n",
    "            #z_temp = torch.randn(1)\n",
    "            user_action[i] = user_action[i] - 500000*proj_grad*z_temp\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(model_last_five.qi)):\n",
    "        total_sum += torch.exp(0.8 * torch.matmul(user_vector, torch.tensor(model_last_five.qi[item])))\n",
    "    return final_rating/total_sum"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "-torch.exp(0.8*torch.matmul(torch.tensor(model_last_five.pu[20]), torch.tensor(model_last_five.qi[25])))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mezo_past_user_item_reachability(275,28,5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trainset.ur[10][-1:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print('hi')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def mezo_past_k_stability(adversary, curr_user, k):\n",
    "    torch.manual_seed(0)\n",
    "    file_path = 'surprise_model_last_five.dump'\n",
    "    # Load the saved model\n",
    "    _, model_last_five = dump.load(file_path)\n",
    "    item_and_rating = trainset.ur[adversary][-k:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64)\n",
    "    item_vector_copy = torch.tensor(model_last_five.qi) #change as per k\n",
    "    user_vector = torch.tensor(model_last_five.pu[curr_user])\n",
    "    initial_rec_list = get_all_preferences(user_vector, item_vector_copy)\n",
    "    initial_rec_list_softmax = F.softmax(initial_rec_list)\n",
    "    #print(initial_rec_list)\n",
    "    n_epochs = 50\n",
    "    distance_metric = None\n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        ####\n",
    "        z_temp = torch.randn(1)\n",
    "        user_action_post = perturb_parameters(user_action, 0.1, 0, z_temp)\n",
    "        user_action_pre = perturb_parameters(user_action, -0.1, 0, z_temp)\n",
    "        # print(user_action_post)\n",
    "        # print(user_action_pre)\n",
    "        user_action_post_clamped = user_action_post.clamp(1,5)\n",
    "        user_action_pre_clamped = user_action_pre.clamp(1,5)\n",
    "        ####\n",
    "        item_vector_copy_tensor = torch.tensor(model_last_five.qi) #change as per k\n",
    "        item_vector_pre = item_vector_copy_tensor.detach().clone()\n",
    "        item_vector_post = item_vector_copy_tensor.detach().clone()\n",
    "        for loop_var in range(0,k):\n",
    "            curr_item = chosen_items[loop_var]\n",
    "            user_list = [item_user_matrix5[curr_item][i][0] for i in range(len(item_user_matrix5[curr_item]))] #change as per k\n",
    "            #print(user_list)\n",
    "            rating_list = torch.tensor([item_user_matrix5[curr_item][i][1] for i in range(len(item_user_matrix5[curr_item]))], dtype = torch.float64) #change as per k\n",
    "            user_list.append(adversary)\n",
    "            ####\n",
    "            rating_list_pre = torch.cat((rating_list, user_action_pre_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "            rating_list_post = torch.cat((rating_list, user_action_post_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "            ####\n",
    "            rating_list = torch.cat((rating_list, user_action_clamped[loop_var].unsqueeze(0)), dim=0)\n",
    "            item_vector_copy_tensor[curr_item] = update_item_tensor_five(item_vector_copy_tensor[curr_item], user_list, rating_list)\n",
    "            ####\n",
    "            item_vector_pre[curr_item] = update_item_tensor_five(item_vector_pre[curr_item], user_list, rating_list_pre)\n",
    "            item_vector_post[curr_item] = update_item_tensor_five(item_vector_post[curr_item], user_list, rating_list_post)\n",
    "            ####\n",
    "        final_rec_list = get_all_preferences(user_vector, item_vector_copy_tensor)\n",
    "        # print(\"Unequal elements:\")\n",
    "        # for i in range(len(initial_rec_list)):\n",
    "        #     if initial_rec_list[i] != final_rec_list[i]:\n",
    "        #         print(f\"Index {i}: Initial - {initial_rec_list[i]}, Final - {final_rec_list[i]}\")\n",
    "        #print(final_rec_list)\n",
    "        ####\n",
    "        final_rec_list_pre = get_all_preferences(user_vector, item_vector_pre)\n",
    "        final_rec_list_post = get_all_preferences(user_vector, item_vector_post)\n",
    "        # print(final_rec_list_pre)\n",
    "        # print(final_rec_list_post)\n",
    "        ####\n",
    "        final_rec_list_pre_softmax = F.softmax(final_rec_list_pre)\n",
    "        final_rec_list_post_softmax = F.softmax(final_rec_list_post)\n",
    "        final_rec_list_softmax = F.softmax(final_rec_list)\n",
    "        distance_metric = -hellinger_distance(final_rec_list_softmax,initial_rec_list_softmax)\n",
    "        print(distance_metric)\n",
    "        d_pre = -hellinger_distance(final_rec_list_pre_softmax,initial_rec_list_softmax)\n",
    "        d_post = -hellinger_distance(final_rec_list_post_softmax,initial_rec_list_softmax)\n",
    "        proj_grad = (d_post-d_pre)/(2*0.1)\n",
    "        print(proj_grad)\n",
    "        # torch.manual_seed(0)\n",
    "        for i in range(0,len(user_action)):\n",
    "            # z_temp = torch.randn(1)\n",
    "            user_action[i] = user_action[i] - 20000*proj_grad*z_temp\n",
    "        #print(user_action_clamped)\n",
    "    return distance_metric.item()\n",
    "    \n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "mezo_past_k_stability(201,2568,5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "RNN"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#okay reachability first\n",
    "#the user vector will now be the user vector ignoring the last five interactions\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = ratings_df[['user_int', 'movie_id', 'rating']]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "import numpy as np\n",
    "from torch.autograd import Variable\n",
    "\n",
    "class RRN(nn.Module):\n",
    "    def __init__(self):\n",
    "        super(RRN, self).__init__()\n",
    "\n",
    "        # Hyperparameters\n",
    "        self.batch_size = 500\n",
    "        self.n_step = 1\n",
    "        self.lr = 0.001\n",
    "        self.verbose = 100\n",
    "\n",
    "        # Data\n",
    "        dataSet = data # \n",
    "        a = dataSet\n",
    "        self.train = a.values\n",
    "        #print(self.train.shape)\n",
    "        # print(len(np.unique(self.train[:, 1])))\n",
    "        #self.valid = b.values\n",
    "\n",
    "        # Model\n",
    "        self.add_embedding_layer()\n",
    "\n",
    "        # Loss and Optimizer\n",
    "        self.criterion = nn.MSELoss()\n",
    "        self.optimizer = optim.Adam(self.parameters(), lr=self.lr)\n",
    "\n",
    "    def save_model(self):\n",
    "        # Save the model\n",
    "        torch.save(self.state_dict(), \"rrn_model_2.pth\")\n",
    "        print(\"Model saved\")\n",
    "\n",
    "    def add_embedding_layer(self):\n",
    "        self.user_embedding = nn.Embedding(6040, 128)\n",
    "        self.movie_embedding = nn.Embedding(3706, 128)\n",
    "        self.user_rnn = nn.GRU(128, 128, batch_first=True)\n",
    "        self.movie_rnn = nn.GRU(128, 128, batch_first=True)\n",
    "        self.user_output_layer = nn.Linear(128, 64)\n",
    "        self.movie_output_layer = nn.Linear(128, 64)\n",
    "\n",
    "    def forward(self, userID, movieID):\n",
    "        uid_embedding = self.user_embedding(userID)\n",
    "        mid_embedding = self.movie_embedding(movieID)\n",
    "\n",
    "        user_rnn_output, _ = self.user_rnn(mid_embedding)\n",
    "        movie_rnn_output, _ = self.movie_rnn(uid_embedding)\n",
    "\n",
    "        #user_output = self.user_output_layer(user_rnn_output[:, -1, :])\n",
    "        user_output = self.user_output_layer(user_rnn_output)\n",
    "        movie_output = self.movie_output_layer(movie_rnn_output)\n",
    "\n",
    "        pred = torch.sum(user_output * movie_output, dim=1, keepdim=True)\n",
    "\n",
    "        return pred\n",
    "\n",
    "    def run(self):\n",
    "        length = len(self.train)\n",
    "        batches = length // self.batch_size + 1\n",
    "\n",
    "        train_loss = []\n",
    "        valid_loss = []\n",
    "\n",
    "        for i in range(batches):\n",
    "            minIdx = i * self.batch_size\n",
    "            maxIdx = min(length, (i + 1) * self.batch_size)\n",
    "            train_batch = self.train[minIdx:maxIdx]\n",
    "            feed_dict_train = self.create_feed_dict(train_batch)\n",
    "\n",
    "            outputs = self.forward(feed_dict_train['userID'], feed_dict_train['movieID'])\n",
    "            # print(outputs.shape)\n",
    "            # print(outputs)\n",
    "            # print(feed_dict_train['rating'].shape)\n",
    "            # print(feed_dict_train['rating'].view(-1,1))\n",
    "            loss = self.criterion(outputs, feed_dict_train['rating'].view(-1,1))\n",
    "            train_loss.append(loss.item())\n",
    "\n",
    "            self.optimizer.zero_grad()\n",
    "            loss.backward()\n",
    "            self.optimizer.step()\n",
    "\n",
    "            if i % self.verbose == 0:\n",
    "                print('\\rTraining: Batch {}/{} - Loss: {:.4f}'.format(\n",
    "                    i, batches, np.sqrt(np.mean(train_loss[-20:]))\n",
    "                ), end='')\n",
    "\n",
    "            # Check validation loss every verbose steps\n",
    "            #if i % self.verbose == 0 and i != 0:\n",
    "                #feed_dict_valid = self.create_feed_dict(self.valid)\n",
    "                #outputs_valid = self.forward(feed_dict_valid['userID'], feed_dict_valid['movieID'])\n",
    "                #valid_loss_epoch = self.criterion(outputs_valid, feed_dict_valid['rating'].view(-1,1)).item()\n",
    "                #valid_loss.append(np.sqrt(valid_loss_epoch))\n",
    "                #print(' - Validation Loss: {:.4f}'.format(valid_loss[-1]), end='')\n",
    "\n",
    "        print(\"\\nTraining Finish, Last 2000 batches loss is {}.\".format(\n",
    "            np.sqrt(np.mean(train_loss[-2000:]))\n",
    "        ))\n",
    "        #feed_dict_valid = self.create_feed_dict(self.valid)\n",
    "        #outputs_valid = self.forward(feed_dict_valid['userID'], feed_dict_valid['movieID'])\n",
    "        #valid_loss_epoch = self.criterion(outputs_valid, feed_dict_valid['rating'].view(-1,1)).item()\n",
    "        #print(\"Validation Loss: {:.4f}\".format(np.sqrt(valid_loss_epoch)))\n",
    "        self.save_model()\n",
    "\n",
    "    def create_feed_dict(self, data):\n",
    "        userID = torch.LongTensor([i[0] - 1 for i in data])\n",
    "        movieID = torch.LongTensor([i[1] - 1 for i in data])\n",
    "        ratings = torch.FloatTensor([float(i[2]) for i in data])\n",
    "        return {\n",
    "            'userID': userID,\n",
    "            'movieID': movieID,\n",
    "            'rating': ratings,\n",
    "        }\n",
    "\n",
    "\n",
    "# if __name__ == '__main__':\n",
    "#     model = RRN()\n",
    "#     model.run()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "model = RRN()\n",
    "model.load_state_dict(torch.load('rrn_model_3.pth'))\n",
    "# model.eval()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_user_item_reachability_rnn(model, user_id, item_id, past_time):\n",
    "    model.to('cpu')\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating = trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float32)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "\n",
    "    for epoch in tqdm(range(1, 50)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        # user_vector = model.user_embedding(torch.tensor([user_id]))\n",
    "        # item_vector = model.movie_embedding(torch.tensor([item_to_be_reached]))\n",
    "        for timestep in range(past_time):\n",
    "            for inner_epoch in range(1,40):\n",
    "                model.optimizer.zero_grad()\n",
    "                curr_item = chosen_items[timestep]\n",
    "                curr_rating = user_action_clamped[timestep]\n",
    "                pred_rating = model(torch.LongTensor([user_id]), torch.LongTensor([curr_item]))\n",
    "                diff = model.criterion(pred_rating[0][0], curr_rating)\n",
    "                # print(\"Hello \",diff)\n",
    "                diff.backward(retain_graph=True)\n",
    "                model.optimizer.step()\n",
    "\n",
    "        item_rating = -torch.exp(0.8*model(torch.LongTensor([user_id]), torch.LongTensor([item_to_be_reached])))\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "\n",
    "    # Calculate probability\n",
    "    total_sum = 0\n",
    "    for item in range(model.movie_embedding.weight.shape[0]):\n",
    "        item_r = torch.exp(0.8*model(torch.LongTensor([user_id]), torch.LongTensor([item])))\n",
    "        total_sum += item_r\n",
    "\n",
    "    return final_rating / total_sum"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "past_user_item_reachability_rnn(model, 25, 20, 5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "user_lstm = torch.nn.LSTM(2, 100)\n",
    "item_lstm = torch.nn.LSTM(2, 100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lstm.load_state_dict(torch.load('user_model_val.pth'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_lstm.load_state_dict(torch.load('item_model_val.pth'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = torch.device(\"cpu\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "user_lstm.to(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "item_lstm.to(device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.set_device(6)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch.nn.functional as F\n",
    "def past_user_item_reachability_lstm(user_id, item_id, past_time):\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    \n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating = trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=8)\n",
    "    \n",
    "    item_lstm.to(device)\n",
    "    user_lstm.to(device)\n",
    "    \n",
    "    final_rating = 0\n",
    "    init_val = 0\n",
    "    for epoch in range(1, 5):\n",
    "        user_h = user_item_rating_tensor5[user_id].detach().clone().to(device)\n",
    "        user_action_clamped = user_action.clamp(1, 5).to(device)\n",
    "        rating_tensor = user_h.to(device)\n",
    "        _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "        user_vector_initial = user_vector_initial[-1]\n",
    "        \n",
    "        time_max = past_time\n",
    "        n = len(rating_tensor)\n",
    "        zeros_to_add = torch.zeros(time_max, 1, 2).to(device)\n",
    "        ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "        \n",
    "        for timestep in range(0, time_max):\n",
    "            curr_item = chosen_items[timestep]\n",
    "            ratings[n+timestep][0][0] = curr_item\n",
    "            ratings[n+timestep][0][1] = user_action_clamped[timestep]\n",
    "        _, (user_vector, _) = user_lstm(ratings)\n",
    "        user_vector = user_vector[-1]\n",
    "        item_scores = []\n",
    "        for item_ in range(len(model_last_five.qi)):\n",
    "            item_history_ = item_user_rating_tensor5[item_].to(device)\n",
    "            _, (item_vector_, _) = item_lstm(item_history_)\n",
    "            item_vector_ = item_vector_[-1]\n",
    "            item_score = 0.8 * torch.dot(user_vector.view(-1), item_vector_.view(-1))\n",
    "            item_scores.append(item_score)\n",
    "        # print(item_scores)\n",
    "        item_scores = torch.stack(item_scores)\n",
    "        log_softmax_scores = F.log_softmax(item_scores, dim=0)\n",
    "        target_item_score = log_softmax_scores[item_to_be_reached]\n",
    "        #print(target_item_score)\n",
    "        # print(user_action)\n",
    "        #print(ratings)\n",
    "        if epoch == 1:\n",
    "            init_val = target_item_score.item()\n",
    "        target_item_score.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "        \n",
    "    if init_val!=0:\n",
    "        diff_val = init_val - target_item_score\n",
    "        final_rating = torch.exp(diff_val).item()\n",
    "    return final_rating, target_item_score.item()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_user_item_reachability_lstm(user_id, item_id, past_time):\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    \n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating = trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.8)\n",
    "    \n",
    "    item_lstm.to(device)\n",
    "    user_lstm.to(device)\n",
    "    \n",
    "    final_rating = 0\n",
    "    for epoch in range(1, 5):\n",
    "        item_history = item_user_rating_tensor5[item_to_be_reached].to(device)\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor5[user_id].detach().clone().to(device)\n",
    "        user_action_clamped = user_action.clamp(1, 5).to(device)\n",
    "        rating_tensor = user_h.to(device)\n",
    "        _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "        user_vector_initial = user_vector_initial[-1]\n",
    "        user_vector = user_vector_initial\n",
    "        \n",
    "        time_max = past_time\n",
    "        n = len(rating_tensor)\n",
    "        zeros_to_add = torch.zeros(time_max, 1, 2).to(device)\n",
    "        ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "        \n",
    "        for timestep in range(0, time_max):\n",
    "            curr_item = chosen_items[timestep]\n",
    "            ratings[n+timestep][0][0] = curr_item\n",
    "            ratings[n+timestep][0][1] = user_action_clamped[timestep]\n",
    "        _, (user_vector, _) = user_lstm(ratings[:n+time_max])\n",
    "        user_vector = user_vector[-1]\n",
    "        # print(ratings[n:])\n",
    "        total_sum = 0\n",
    "        for item_ in range(len(model_last_five.qi)):\n",
    "            item_history_ = item_user_rating_tensor5[item_].to(device)\n",
    "            _, (item_vector_, _) = item_lstm(item_history_)\n",
    "            item_vector_ = item_vector_[-1]\n",
    "            total_sum += torch.exp(0.8 * torch.dot(user_vector.view(-1), item_vector_.view(-1)))\n",
    "        item_rating = -torch.exp(0.8 * torch.dot(user_vector.view(-1), item_vector.view(-1)))/total_sum\n",
    "        print(item_rating)\n",
    "        print(user_action)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "        \n",
    "    final_rating = -item_rating.item() \n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_user_item_reachability_lstm(user_id, item_id, past_time):\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating =  trainset.ur[user_id][-past_time:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=8)\n",
    "    # reach_probabilities = []\n",
    "    \n",
    "    final_rating=0\n",
    "    for epoch in range(1, 50):\n",
    "        item_history = item_user_rating_tensor5[item_to_be_reached]\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor5[user_id].detach().clone()\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        rating_tensor = user_h\n",
    "        _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "        user_vector_initial = user_vector_initial[-1]\n",
    "        # user_vector_initial = torch.tensor(model_last_five.pu[user_id])\n",
    "        user_vector = user_vector_initial\n",
    "        time_max = past_time\n",
    "        n = len(rating_tensor)\n",
    "        zeros_to_add = torch.zeros(time_max, 1, 2)\n",
    "        ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "        for timestep in range(0,time_max):\n",
    "            curr_item = chosen_items[timestep]\n",
    "            ratings[n+timestep][0][0] = curr_item\n",
    "            ratings[n+timestep][0][1] = user_action_clamped[timestep]\n",
    "        _, (user_vector, _) = user_lstm(ratings[:n+time_max])\n",
    "        user_vector = user_vector[-1]\n",
    "        item_rating = -torch.exp(0.8*torch.dot(user_vector.view(-1), item_vector.view(-1)))\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "        #user_action = user_action.clamp(1, 5) \n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(model_last_five.qi)):\n",
    "        item_history = item_user_rating_tensor5[item]\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        total_sum += torch.exp(0.8*torch.dot(user_vector.view(-1), item_vector.view(-1)))\n",
    "    return final_rating/total_sum"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.set_printoptions(precision=14)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "past_user_item_reachability_lstm(300,43,5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "-7.88623142242432 + 7.88564205169678"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.exp(0.0005893707275399507)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "len(item_user_rating_tensor)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "item_lstm.to(device)\n",
    "\n",
    "all_item_vectors = []\n",
    "n_items = len(item_user_rating_tensor)\n",
    "for i in tqdm(range(0, n_items)):\n",
    "    item_history = item_user_rating_tensor[i].to(device)\n",
    "    _, (item_vector, _) = item_lstm(item_history)\n",
    "    item_vector = item_vector[-1]\n",
    "    all_item_vectors.append(item_vector)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# all_item_vectors = []\n",
    "# n_items = len(item_user_rating_tensor)\n",
    "# for i in tqdm(range(0,n_items)):\n",
    "#     item_history = item_user_rating_tensor[i]\n",
    "#     _, (item_vector, _) = item_lstm(item_history)\n",
    "#     item_vector = item_vector[-1]\n",
    "#     all_item_vectors.append(item_vector)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# file = open('allitems', 'wb')\n",
    "\n",
    "# # dump information to that file\n",
    "# pickle.dump(all_item_vectors, file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "item_lstm.to(device)\n",
    "\n",
    "all_item_vectors1 = []\n",
    "n_items = len(item_user_rating_tensor1)\n",
    "for i in tqdm(range(0,n_items)):\n",
    "    item_history = item_user_rating_tensor1[i].to(device)\n",
    "    _, (item_vector, _) = item_lstm(item_history)\n",
    "    item_vector = item_vector[-1]\n",
    "    all_item_vectors1.append(item_vector)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "item_lstm.to(device)\n",
    "\n",
    "all_item_vectors5 = []\n",
    "n_items = len(item_user_rating_tensor5)\n",
    "for i in tqdm(range(0,n_items)):\n",
    "    item_history = item_user_rating_tensor5[i].to(device)\n",
    "    _, (item_vector, _) = item_lstm(item_history)\n",
    "    item_vector = item_vector[-1]\n",
    "    all_item_vectors5.append(item_vector)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_all_recommendation_scores_lstm(user_vector, sample_size, beta = 0.8):\n",
    "    num_samples = sample_size\n",
    "    n_items = len(item_user_rating_tensor)\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}  \n",
    "    for item in range(0, n_items):\n",
    "        item_rating = torch.dot(user_vector.view(-1), all_item_vectors[item].view(-1))\n",
    "        predicted_ratings[item] = item_rating       \n",
    "    \n",
    "    # Convert the predicted ratings dictionary to PyTorch tensor\n",
    "    ratings_tensor_1 = torch.tensor(list(predicted_ratings.values()), dtype=torch.float)\n",
    "    \n",
    "    # Compute probabilities proportional to exp(beta*predicted_rating)\n",
    "    probabilities = F.softmax(beta * ratings_tensor_1, dim=0)\n",
    "    \n",
    "    # Sample num_samples items based on the probability distribution\n",
    "    sampled_indices = torch.multinomial(probabilities, num_samples, replacement=False)\n",
    "    \n",
    "    # Convert indices to item names and corresponding predicted scores\n",
    "    sampled_items = [list(predicted_ratings.keys())[idx] for idx in sampled_indices]\n",
    "    sampled_scores = [list(predicted_ratings.values())[idx] for idx in sampled_indices]\n",
    "    \n",
    "    return sampled_items, sampled_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_top_recommendations_lstm(user_vector, sample_size, beta=0.8):\n",
    "    n_items = len(item_user_rating_tensor)\n",
    "    predicted_ratings = {index: None for index in range(0, n_items)}\n",
    "\n",
    "    for item in range(0, n_items):\n",
    "        item_rating = torch.dot(user_vector.view(-1), all_item_vectors[item].view(-1))\n",
    "        predicted_ratings[item] = item_rating\n",
    "\n",
    "    # Sort the predicted ratings in descending order\n",
    "    sorted_ratings = sorted(predicted_ratings.items(), key=lambda x: x[1], reverse=True)\n",
    "\n",
    "    # # Get the top sample_size items and their corresponding scores\n",
    "    # top_items = [item for item, score in sorted_ratings[:sample_size]]\n",
    "    # top_scores = [score for item, score in sorted_ratings[:sample_size]]\n",
    "\n",
    "    return sorted_ratings[0][0], sorted_ratings[0][1]\n",
    "    # return top_items, top_scores"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#deterministic\n",
    "#this is the one\n",
    "#big parameter list\n",
    "\n",
    "def future_user_item_reachability_lstm(user_id, item_id, future_time):\n",
    "    torch.cuda.set_device(5)\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    item_lstm.to(device)\n",
    "    user_lstm.to(device)\n",
    "\n",
    "    item_to_be_reached = item_id\n",
    "    chosen_ratings = [5] * future_time * len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "\n",
    "    final_rating = 0\n",
    "    for epoch in range(1, 5):\n",
    "        rating_vals = torch.zeros(10).to(device)\n",
    "        item_history = item_user_rating_tensor[item_to_be_reached].to(device)\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor[user_id].detach().clone().to(device)\n",
    "\n",
    "        for int_var in range(0, len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = user_h\n",
    "            _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "            user_vector_initial = user_vector_initial[-1]\n",
    "            user_vector = user_vector_initial\n",
    "\n",
    "            time_max = future_time\n",
    "            n = len(rating_tensor)\n",
    "            zeros_to_add = torch.zeros(time_max, 1, 2).to(device)\n",
    "            ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "\n",
    "            for timestep in range(0, time_max):\n",
    "                recommendation, recommendation_score = get_top_recommendations_lstm(user_vector, sample_size=1)\n",
    "                ratings[n+timestep][0][0] = recommendation\n",
    "                ratings[n+timestep][0][1] = user_action_clamped[5*recommendation+timestep]\n",
    "                _, (user_vector, _) = user_lstm(ratings[:n+timestep+1])\n",
    "                user_vector = user_vector[-1]\n",
    "            item_scores = []\n",
    "            for item_ in range(len(model.qi)):\n",
    "                item_history_ = item_user_rating_tensor[item_].to(device)\n",
    "                _, (item_vector_, _) = item_lstm(item_history_)\n",
    "                item_vector_ = item_vector_[-1]\n",
    "                item_score = 0.8 * torch.dot(user_vector.view(-1), item_vector_.view(-1))\n",
    "                item_scores.append(item_score)\n",
    "            # print(item_scores)\n",
    "            item_scores = torch.stack(item_scores)\n",
    "            log_softmax_scores = F.log_softmax(item_scores, dim=0)\n",
    "            rating_vals[int_var] = log_softmax_scores[item_to_be_reached]\n",
    "\n",
    "        item_rating = sum(rating_vals) / len(rating_vals)\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "\n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def future_user_item_reachability_lstm(user_id, item_id, future_time):\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    item_lstm.to(device)\n",
    "    user_lstm.to(device)\n",
    "\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating = trainset.ur[user_id][-future_time:]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "\n",
    "    final_rating = 0\n",
    "    for epoch in range(1, 50):\n",
    "        rating_vals = torch.zeros(100).to(device)\n",
    "        item_history = item_user_rating_tensor[item_to_be_reached].to(device)\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor[user_id].detach().clone().to(device)\n",
    "\n",
    "        for int_var in range(0, len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = user_h\n",
    "            _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "            user_vector_initial = user_vector_initial[-1]\n",
    "            user_vector = user_vector_initial\n",
    "\n",
    "            time_max = future_time\n",
    "            n = len(rating_tensor)\n",
    "            zeros_to_add = torch.zeros(time_max, 1, 2).to(device)\n",
    "            ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "\n",
    "            for timestep in range(0, time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_lstm(user_vector, sample_size=1)\n",
    "                ratings[n+timestep][0][0] = recommendation[0]\n",
    "                ratings[n+timestep][0][1] = user_action_clamped[timestep]\n",
    "                _, (user_vector, _) = user_lstm(ratings[:n+1])\n",
    "                user_vector = user_vector[-1]\n",
    "\n",
    "            rating_vals[int_var] = -torch.exp(0.8 * torch.dot(user_vector.view(-1), item_vector.view(-1)))\n",
    "\n",
    "        item_rating = sum(rating_vals) / len(rating_vals)\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "        final_rating = -item_rating.item()\n",
    "\n",
    "    total_sum = 0\n",
    "    for item in range(len(item_user_rating_tensor)):\n",
    "        total_sum += torch.exp(0.8 * torch.dot(user_vector.view(-1), all_item_vectors[item].to(device).view(-1)))\n",
    "\n",
    "    return final_rating / total_sum.item()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#modified version with more samples for more stable gradient\n",
    "\n",
    "def future_user_item_reachability_lstm(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    item_and_rating =  trainset.ur[user_id][-future_time:]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    final_rating=0\n",
    "    for epoch in range(1, 50):\n",
    "        rating_vals =torch.zeros(100)\n",
    "        item_history = item_user_rating_tensor[item_to_be_reached]\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor[user_id].detach().clone()\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = user_h\n",
    "            _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "            user_vector_initial = user_vector_initial[-1]\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            n = len(rating_tensor)\n",
    "            zeros_to_add = torch.zeros(time_max, 1, 2)\n",
    "            ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_lstm(user_vector, sample_size=1)\n",
    "                ratings[n+timestep][0][0] = recommendation[0]\n",
    "                ratings[n+timestep][0][1] = user_action_clamped[timestep]\n",
    "                _, (user_vector, _) = user_lstm(ratings[:n+1])\n",
    "                user_vector = user_vector[-1]\n",
    "            rating_vals[int_var] = -torch.exp(0.8*torch.dot(user_vector.view(-1), item_vector.view(-1)))\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(item_user_rating_tensor)):\n",
    "        total_sum += torch.exp(0.8*torch.dot(user_vector.view(-1), all_item_vectors[item].view(-1)))\n",
    "    return final_rating/total_sum  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "torch.cuda.set_device(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#nah this is final frfr\n",
    "\n",
    "def future_user_item_reachability_lstm(user_id, item_id, future_time):\n",
    "    torch.cuda.set_device(5)\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    item_lstm.to(device)\n",
    "    user_lstm.to(device)\n",
    "\n",
    "    item_to_be_reached = item_id\n",
    "    chosen_ratings = [5] * future_time * len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=4)\n",
    "\n",
    "    final_rating = 0\n",
    "\n",
    "    # Precompute item vectors\n",
    "    with torch.no_grad():\n",
    "        item_vectors = []\n",
    "        for item_ in range(len(model.qi)):\n",
    "            item_history_ = item_user_rating_tensor[item_].to(device)\n",
    "            _, (item_vector_, _) = item_lstm(item_history_)\n",
    "            item_vector_ = item_vector_[-1]\n",
    "            item_vectors.append(item_vector_)\n",
    "        item_vectors = torch.stack(item_vectors)\n",
    "\n",
    "    for epoch in range(1, 5):\n",
    "        user_h = user_item_rating_tensor[user_id].detach().clone().to(device)\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        rating_tensor = user_h\n",
    "        _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "        user_vector_initial = user_vector_initial[-1]\n",
    "        user_vector = user_vector_initial\n",
    "\n",
    "        time_max = future_time\n",
    "        n = len(rating_tensor)\n",
    "        zeros_to_add = torch.zeros(time_max, 1, 2).to(device)\n",
    "        ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "\n",
    "        for timestep in range(0, time_max):\n",
    "            recommendation, recommendation_score = get_top_recommendations_lstm(user_vector, sample_size=1)\n",
    "            ratings[n+timestep][0][0] = recommendation\n",
    "            ratings[n+timestep][0][1] = user_action_clamped[5*recommendation+timestep]\n",
    "            _, (user_vector, _) = user_lstm(ratings[:n+timestep+1])\n",
    "            user_vector = user_vector[-1]\n",
    "\n",
    "        item_scores = []\n",
    "        for item_vector_ in item_vectors:\n",
    "            item_score = torch.dot(user_vector.view(-1), item_vector_.view(-1))\n",
    "            item_scores.append(item_score)\n",
    "        item_scores = torch.stack(item_scores)\n",
    "        log_softmax_scores = F.log_softmax(item_scores, dim=0)\n",
    "        item_rating = log_softmax_scores[item_to_be_reached]\n",
    "        print(user_action)\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "\n",
    "    return final_rating"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_user_item_reachability_lstm(200,52,5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#modified version with more samples for more stable gradient\n",
    "\n",
    "def future_user_item_reachability_lstm2(user_id, item_id, future_time):\n",
    "    item_to_be_reached = item_id\n",
    "    chosen_ratings = [5.0]*len(item_user_rating_tensor)\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    # reach_probabilities = []\n",
    "    final_rating=0\n",
    "    for epoch in range(1, 50):\n",
    "        rating_vals =torch.zeros(100)\n",
    "        item_history = item_user_rating_tensor[item_to_be_reached]\n",
    "        _, (item_vector, _) = item_lstm(item_history)\n",
    "        item_vector = item_vector[-1]\n",
    "        user_h = user_item_rating_tensor[user_id].detach().clone()\n",
    "        for int_var in range(0,len(rating_vals)):\n",
    "            user_action_clamped = user_action.clamp(1, 5)\n",
    "            rating_tensor = user_h\n",
    "            _, (user_vector_initial, _) = user_lstm(rating_tensor)\n",
    "            user_vector_initial = user_vector_initial[-1]\n",
    "            user_vector = user_vector_initial\n",
    "            time_max = future_time\n",
    "            n = len(rating_tensor)\n",
    "            zeros_to_add = torch.zeros(time_max, 1, 2)\n",
    "            ratings = torch.cat((rating_tensor, zeros_to_add), dim=0)\n",
    "            for timestep in range(0,time_max):\n",
    "                recommendation, recommendation_score = get_all_recommendation_scores_lstm(user_vector, sample_size=1)\n",
    "                ratings[n+timestep][0][0] = recommendation[0]\n",
    "                ratings[n+timestep][0][1] = user_action_clamped[recommendation]\n",
    "                _, (user_vector, _) = user_lstm(ratings[:n+1])\n",
    "                user_vector = user_vector[-1]\n",
    "            rating_vals[int_var] = -torch.exp(0.8*torch.dot(user_vector.view(-1), item_vector.view(-1)))\n",
    "        item_rating = sum(rating_vals)/len(rating_vals)\n",
    "        print(item_rating)\n",
    "        item_rating.backward()\n",
    "        optimizer.step()\n",
    "        # print(user_action)\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    final_rating = -item_rating.item()\n",
    "    #now get probability\n",
    "    total_sum = 0\n",
    "    for item in range(len(item_user_rating_tensor)):\n",
    "        total_sum += torch.exp(0.8*torch.dot(user_vector.view(-1), all_item_vectors[item].view(-1)))\n",
    "    return final_rating/total_sum  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_all_preferences_lstm(user_vector_1, item_vector_copy_h):\n",
    "    # Compute ratings for each item by dot product with user_vector\n",
    "    temp_vector = user_vector_1.detach().clone()\n",
    "    item_ratings = torch.matmul(torch.stack(item_vector_copy_h), temp_vector.transpose(0,1))\n",
    "    return item_ratings.squeeze(1) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def hellinger_distance(p, q):\n",
    "    return torch.sqrt(torch.sum((torch.sqrt(p) - torch.sqrt(q)) ** 2)) / torch.sqrt(torch.tensor(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_k_stability_lstm(adversary, curr_user, k):\n",
    "    item_and_rating =  trainset.ur[adversary][-k:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    item_vector_copy = all_item_vectors1.copy() #change as per k\n",
    "    \n",
    "    user_history = user_item_rating_tensor1[curr_user]\n",
    "    _, (user_vector, _) = user_lstm(user_history)\n",
    "    user_vector = user_vector[-1]\n",
    "    \n",
    "    initial_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy)\n",
    "    n_epochs = 50\n",
    "    distance_metric = None\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        item_vector_copy_tensor = all_item_vectors1.copy() #change as per k\n",
    "        for loop_var in range(0,k):\n",
    "            curr_item = chosen_items[loop_var]\n",
    "            user_list = item_user_rating_tensor1[curr_item]\n",
    "            \n",
    "            n = len(user_list)\n",
    "            zeros_to_add = torch.zeros(1, 1, 2)\n",
    "            ratings = torch.cat((user_list, zeros_to_add), dim=0)\n",
    "            ratings[n][0][0] = curr_item\n",
    "            ratings[n][0][1] = user_action_clamped[loop_var]\n",
    "            _, (item_vector_, _) = item_lstm(ratings[:n+1])\n",
    "            \n",
    "            item_vector_copy_tensor[curr_item] = item_vector_[-1]\n",
    "        \n",
    "        final_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy_tensor)\n",
    "        distance_metric = -hellinger_distance(final_rec_list,initial_rec_list)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    return distance_metric.item()\n",
    "    \n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def past_k_stability_lstm(adversary, curr_user, k):\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "    \n",
    "    item_and_rating = trainset.ur[adversary][-k:]\n",
    "    chosen_items = [i[0] for i in item_and_rating]\n",
    "    chosen_ratings = [i[1] for i in item_and_rating]\n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=8)\n",
    "    \n",
    "    item_vector_copy = [vec.to(device) for vec in all_item_vectors5]  # Move item vectors to GPU\n",
    "    user_history = user_item_rating_tensor1[curr_user].to(device)  # Move user history to GPU\n",
    "    _, (user_vector, _) = user_lstm(user_history)\n",
    "    user_vector = user_vector[-1]\n",
    "    \n",
    "    initial_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy).detach()\n",
    "    initial_rec_list_softmax = F.softmax(initial_rec_list, dim=0)\n",
    "    \n",
    "    n_epochs = 20\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        item_vector_copy_tensor = [vec.clone().detach().requires_grad_(True) for vec in item_vector_copy]\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        for loop_var in range(0, k):\n",
    "            curr_item = chosen_items[loop_var]\n",
    "            user_list = item_user_rating_tensor5[curr_item].detach().clone().to(device)  # Move user list to GPU\n",
    "            n = len(user_list)\n",
    "            zeros_to_add = torch.zeros(1, 1, 2).to(device)  # Create zeros tensor on GPU\n",
    "            ratings = torch.cat((user_list, zeros_to_add), dim=0)\n",
    "            ratings[n][0][0] = curr_item\n",
    "            ratings[n][0][1] = user_action_clamped[loop_var]\n",
    "            _, (item_vector_, _) = item_lstm(ratings[:n+1])\n",
    "            item_vector_copy_tensor[curr_item] = item_vector_[-1]\n",
    "        \n",
    "        final_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy_tensor)\n",
    "        final_rec_list_softmax = F.softmax(final_rec_list, dim=0)\n",
    "        distance_metric = -hellinger_distance(final_rec_list_softmax, initial_rec_list_softmax)\n",
    "        print(distance_metric)\n",
    "        print(user_action)\n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    \n",
    "    return distance_metric.item()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "past_k_stability_lstm(2, 19, 5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def future_k_stability_lstm(adversary, curr_user, k):\n",
    "    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "\n",
    "    adversary_history = user_item_rating_tensor[adversary].to(device)\n",
    "    _, (adversary_vector, _) = user_lstm(adversary_history)\n",
    "    adversary_vector = adversary_vector[-1]\n",
    "    chosen_ratings = [5.0] * k * len(model.qi)\n",
    "    user_action = torch.tensor(chosen_ratings, dtype=torch.float64).to(device).clone().detach().requires_grad_(True)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=2)\n",
    "\n",
    "    item_vector_copy = [vec.to(device) for vec in all_item_vectors]  # Move item vectors to GPU\n",
    "    user_history = user_item_rating_tensor[curr_user].to(device)\n",
    "    _, (user_vector, _) = user_lstm(user_history)\n",
    "    user_vector = user_vector[-1]\n",
    "    initial_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy).detach()\n",
    "    initial_rec_list_softmax = F.softmax(initial_rec_list, dim=0)\n",
    "    \n",
    "    n_epochs = 10\n",
    "    distance_metric = None\n",
    "\n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        item_vector_copy_tensor = [vec.clone().detach().requires_grad_(True) for vec in item_vector_copy]\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        for loop_var in range(0, k):\n",
    "            curr_item, _ = get_top_recommendations_lstm(adversary_vector, sample_size=1)\n",
    "            user_list = item_user_rating_tensor[curr_item].detach().clone().to(device)  # Move user list to GPU\n",
    "            n = len(user_list)\n",
    "            zeros_to_add = torch.zeros(1, 1, 2).to(device)  # Create zeros tensor on GPU\n",
    "            ratings = torch.cat((user_list, zeros_to_add), dim=0)\n",
    "            ratings[n][0][0] = curr_item\n",
    "            ratings[n][0][1] = user_action_clamped[loop_var]\n",
    "            _, (item_vector_, _) = item_lstm(ratings[:n+1])\n",
    "            item_vector_copy_tensor[curr_item] = item_vector_[-1]\n",
    "        \n",
    "        final_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy_tensor)\n",
    "        final_rec_list_softmax = F.softmax(final_rec_list, dim=0)\n",
    "        distance_metric = -hellinger_distance(final_rec_list_softmax, initial_rec_list_softmax)\n",
    "        print(distance_metric)\n",
    "        print(user_action)\n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "    return distance_metric.item()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "future_k_stability_lstm(5,8,5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def future_k_stability_lstm2(adversary, curr_user, k):\n",
    "    adversary_history = user_item_rating_tensor1[adversary]\n",
    "    _, (adversary_vector, _) = user_lstm(adversary_history)\n",
    "    adversary_vector = adversary_vector[-1]\n",
    "    \n",
    "    chosen_ratings = [5.0]*len(item_user_rating_tensor)\n",
    "    \n",
    "    user_action = torch.tensor(chosen_ratings, requires_grad=True, dtype=torch.float64)\n",
    "    optimizer = torch.optim.Adam([user_action], lr=0.08)\n",
    "    \n",
    "    item_vector_copy = all_item_vectors1.copy() #change as per k\n",
    "    \n",
    "    user_history = user_item_rating_tensor1[curr_user]\n",
    "    _, (user_vector, _) = user_lstm(user_history)\n",
    "    user_vector = user_vector[-1]\n",
    "    \n",
    "    initial_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy)\n",
    "    n_epochs = 50\n",
    "    distance_metric = None\n",
    "    \n",
    "    for epoch in tqdm(range(0, n_epochs)):\n",
    "        user_action_clamped = user_action.clamp(1, 5)\n",
    "        item_vector_copy_tensor = all_item_vectors1.copy() #change as per k\n",
    "        for loop_var in range(0,k):\n",
    "            curr_item, recommendation_score = get_all_recommendation_scores_lstm(adversary_vector, sample_size=1)\n",
    "            curr_item = curr_item[0]\n",
    "            item_h = item_user_rating_tensor[curr_item]\n",
    "            n = len(item_h)\n",
    "            zeros_to_add = torch.zeros(1, 1, 2)\n",
    "            new_item_h = torch.cat((item_h, zeros_to_add), dim=0)\n",
    "            new_item_h[n][0][0] = curr_item\n",
    "            new_item_h[n][0][1] = user_action_clamped[curr_item]\n",
    "            \n",
    "            _, (item_vector_, _) = item_lstm(new_item_h[:n+1])\n",
    "            item_vector_copy_tensor[curr_item] = item_vector_[-1]\n",
    "            \n",
    "        final_rec_list = get_all_preferences_lstm(user_vector, item_vector_copy_tensor)\n",
    "        distance_metric = -mse(final_rec_list,initial_rec_list)\n",
    "        print(distance_metric)\n",
    "        \n",
    "        distance_metric.backward()\n",
    "        optimizer.step()\n",
    "        optimizer.zero_grad()\n",
    "    return distance_metric.item()\n",
    "            \n",
    "    "
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "py374",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
