{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "editable": true,
    "slideshow": {
     "slide_type": ""
    },
    "tags": []
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import sys\n",
    "sys.path.append('..')\n",
    "from utils.sim_missing_data import *\n",
    "from models.SRPCA import *"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Load Data/Image"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "file_path = '../datasets/movielens-100k-dataset/ml-100k/u.data'\n",
    "movie_rec = np.loadtxt(file_path, delimiter='\\t')#.astype(np.float32)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[1.96000000e+02, 2.42000000e+02, 3.00000000e+00, 8.81250949e+08],\n",
       "       [1.86000000e+02, 3.02000000e+02, 3.00000000e+00, 8.91717742e+08],\n",
       "       [2.20000000e+01, 3.77000000e+02, 1.00000000e+00, 8.78887116e+08],\n",
       "       ...,\n",
       "       [2.76000000e+02, 1.09000000e+03, 1.00000000e+00, 8.74795795e+08],\n",
       "       [1.30000000e+01, 2.25000000e+02, 2.00000000e+00, 8.82399156e+08],\n",
       "       [1.20000000e+01, 2.03000000e+02, 3.00000000e+00, 8.79959583e+08]])"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "movie_rec"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Set parameters"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "perc = 20 # Percentage of missing data\n",
    "seed = 50\n",
    "i_PCA = 4 # Number of Principal Components\n",
    "max_iter = 50 # Maximum number of ierations before breaking\n",
    "alpha = 1 # balancing estimate update parameter\n",
    "eps = 1e-5 # stability infitisimial\n",
    "eps_tol = 1e-3 # convergence threshold\n",
    "optional_smoothing = False # Option smoothening of estimates each iteration\n",
    "Nan = False # put Nan instead or 0 in missing entries\n",
    "return_normalized = True # return a normalized version of the matrix"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Simulate missing data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "X_avail,X_true,X_norm,X_true_norm,OmegaRow,OmegaCol,mu_O_list,std_O_list,rmIndMatrixRow,rmIndMatrixCol = simulate_missing_data_movielens(movie_rec,\n",
    "                                                                                                                                         perc,\n",
    "                                                                                                                                         eps=eps,\n",
    "                                                                                                                                         Nan=Nan,\n",
    "                                                                                                                                         return_normalized=return_normalized,\n",
    "                                                                                                                                         seed=seed)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Run Algorithm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "#######################################\n",
      "############## SRPCA ##################\n",
      "#######################################\n",
      "Iteration #0, observed error: 0.7818238214252669 hidden error: 0.18819250368392187 time elapsed: 6.8632198257837445\n",
      "Iteration #1, observed error: 0.7643287477220895 hidden error: 0.18664510569797457 time elapsed: 6.957259949995205\n",
      "Iteration #2, observed error: 0.7512340799786076 hidden error: 0.18551435038619868 time elapsed: 7.050122947897762\n",
      "Iteration #3, observed error: 0.7408344887847657 hidden error: 0.18463918595445802 time elapsed: 7.144102283986285\n",
      "Iteration #4, observed error: 0.7322534430387208 hidden error: 0.1839456512328467 time elapsed: 7.2496901887934655\n",
      "Iteration #5, observed error: 0.7249931480897127 hidden error: 0.1833890060299247 time elapsed: 7.342853029957041\n",
      "Iteration #6, observed error: 0.7187389988281997 hidden error: 0.18293502708938097 time elapsed: 7.439146908000112\n",
      "Iteration #7, observed error: 0.7132765791237436 hidden error: 0.18256805506627544 time elapsed: 7.532365038990974\n",
      "Iteration #8, observed error: 0.7084529497637769 hidden error: 0.18225293178059182 time elapsed: 7.625365547835827\n",
      "Iteration #9, observed error: 0.7041554284807057 hidden error: 0.18197243935750843 time elapsed: 7.71950345300138\n",
      "Iteration #10, observed error: 0.7002986365056605 hidden error: 0.18172582999337938 time elapsed: 7.812942088814452\n",
      "Iteration #11, observed error: 0.6968162565038915 hidden error: 0.18151403497087673 time elapsed: 7.906282327836379\n",
      "Iteration #12, observed error: 0.693655656135857 hidden error: 0.18133006444607686 time elapsed: 8.001204033847898\n",
      "Iteration #13, observed error: 0.6907742686746517 hidden error: 0.18116560734274031 time elapsed: 8.097257649991661\n",
      "Iteration #14, observed error: 0.688137071280171 hidden error: 0.181016660941058 time elapsed: 8.190893610008061\n",
      "Iteration #15, observed error: 0.6857147891823036 hidden error: 0.1808856006951484 time elapsed: 8.284850468859076\n",
      "Iteration #16, observed error: 0.6834826151464404 hidden error: 0.18076834336247372 time elapsed: 8.379119330784306\n",
      "Iteration #17, observed error: 0.6814193035748651 hidden error: 0.1806615511568512 time elapsed: 8.475316752912477\n",
      "Iteration #18, observed error: 0.6795065251501732 hidden error: 0.1805620177129409 time elapsed: 8.569590125000104\n",
      "Iteration #19, observed error: 0.677728389609766 hidden error: 0.18047138978339144 time elapsed: 8.662872709799558\n",
      "Iteration #20, observed error: 0.6760710724400365 hidden error: 0.18038762987180426 time elapsed: 8.755970978876576\n",
      "Iteration #21, observed error: 0.6745225086127701 hidden error: 0.18031264340312786 time elapsed: 8.850886639906093\n",
      "Iteration #22, observed error: 0.6730721351407961 hidden error: 0.1802478168149231 time elapsed: 8.94603323796764\n",
      "Iteration #23, observed error: 0.6717106734774421 hidden error: 0.1801906048173665 time elapsed: 9.040322259999812\n",
      "Iteration #24, observed error: 0.6704299460997567 hidden error: 0.1801382907986462 time elapsed: 9.134618324926123\n",
      "Iteration #25, observed error: 0.6692227224674081 hidden error: 0.18008854088946913 time elapsed: 9.232341511873528\n",
      "Iteration #26, observed error: 0.6680825898485082 hidden error: 0.18004107523820131 time elapsed: 9.32599446293898\n",
      "Iteration #27, observed error: 0.667003844898159 hidden error: 0.1799948610685363 time elapsed: 9.42291506798938\n",
      "Iteration #28, observed error: 0.66598140241765 hidden error: 0.1799536475677943 time elapsed: 9.516746619949117\n",
      "Iteration #29, observed error: 0.6650107183009666 hidden error: 0.17991821468922328 time elapsed: 9.625406407983974\n"
     ]
    }
   ],
   "source": [
    "M, tme, total_error =SRPCA_func(X_norm, \n",
    "                                X_true_norm, \n",
    "                                OmegaCoord=[OmegaRow,OmegaCol], \n",
    "                                MissingIndCoord=[rmIndMatrixRow,rmIndMatrixCol],\n",
    "                                DistribProps=[mu_O_list,std_O_list],\n",
    "                                i_PCA=i_PCA, \n",
    "                                alpha=alpha ,\n",
    "                                eps=eps, \n",
    "                                eps_tol=eps_tol, \n",
    "                                optional_smoothing=optional_smoothing,\n",
    "                                verbose=True,\n",
    "                                max_iter=max_iter,\n",
    "                                residErrorType = 'hiddenForMovieLens',\n",
    "                                seed=seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "SRPCA",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
