{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import sys\n",
    "sys.path.append('..')\n",
    "from utils.sim_missing_data import *\n",
    "from models.FastSRPCA import *"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Load Data/Image"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "file_path = '../datasets/movielens-100k-dataset/ml-100k/u.data'\n",
    "movie_rec = np.loadtxt(file_path, delimiter='\\t')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[1.96000000e+02, 2.42000000e+02, 3.00000000e+00, 8.81250949e+08],\n",
       "       [1.86000000e+02, 3.02000000e+02, 3.00000000e+00, 8.91717742e+08],\n",
       "       [2.20000000e+01, 3.77000000e+02, 1.00000000e+00, 8.78887116e+08],\n",
       "       ...,\n",
       "       [2.76000000e+02, 1.09000000e+03, 1.00000000e+00, 8.74795795e+08],\n",
       "       [1.30000000e+01, 2.25000000e+02, 2.00000000e+00, 8.82399156e+08],\n",
       "       [1.20000000e+01, 2.03000000e+02, 3.00000000e+00, 8.79959583e+08]])"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "movie_rec"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Set parameters"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "perc = 20#[20,30,50,60] # Percentage of missing data\n",
    "seed = 50\n",
    "i_PCA = 4 # Number of Principal Components\n",
    "max_iter = 50 # Maximum number of ierations before breaking\n",
    "alpha = 1 # balancing estimate update parameter\n",
    "delta=0.7\n",
    "eps = 1e-5 # stability infitisimial\n",
    "eps_tol = 1e-3 # convergence threshold\n",
    "optional_smoothing = False # Option smoothening of estimates each iteration\n",
    "Nan = False # put Nan instead of 0 in missing entries\n",
    "return_normalized = True # return a normalized version of the matrix"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Simulate missing data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "X_avail,X_true,X_norm,X_true_norm,OmegaRow,OmegaCol,mu_O_list,std_O_list,rmIndMatrixRow,rmIndMatrixCol = simulate_missing_data_movielens(movie_rec,\n",
    "                                                                                                                                         perc,\n",
    "                                                                                                                                         eps=eps,\n",
    "                                                                                                                                         Nan=Nan,\n",
    "                                                                                                                                         return_normalized=return_normalized,\n",
    "                                                                                                                                         seed=seed)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Run Algorithm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#######################################\n",
      "############## SRPCA ##################\n",
      "#######################################\n",
      "Iteration #0, observed error: 0.7818238214252669 hidden error: 0.18819250368392187 , alpha 1, time elapsed: 6.781826009042561\n",
      "Iteration #1, observed error: 0.7643287477220895 hidden error: 0.18664510569797457 , alpha 1, time elapsed: 6.88141282601282\n",
      "Iteration #2, observed error: 0.7643287477220895 hidden error: 0.18664510569797457 , alpha 0, time elapsed: 6.999609916005284\n"
     ]
    }
   ],
   "source": [
    "M, tme, total_error =fastSRPCA_func(X_norm, \n",
    "                                 X_true_norm, \n",
    "                                 OmegaCoord=[OmegaRow,OmegaCol], \n",
    "                                 MissingIndCoord=[rmIndMatrixRow,rmIndMatrixCol],\n",
    "                                 DistribProps= [mu_O_list,std_O_list],\n",
    "                                 i_PCA=i_PCA, \n",
    "                                 alpha=alpha , \n",
    "                                 delta=delta,\n",
    "                                 eps=eps, \n",
    "                                 eps_tol=eps_tol, \n",
    "                                 optional_smoothing=optional_smoothing,\n",
    "                                 residErrorType = 'hiddenForMovieLens',\n",
    "                                 verbose=True,\n",
    "                                 seed=seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "SRPCA",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
