{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "Convert the rating matrix into conversion rate matrix;\n",
    "Generate the simulated prediction conversion rate matrix.\n",
    "\"\"\"\n",
    "import pickle\n",
    "import numpy as np\n",
    "\n",
    "file = open(\"data/predicted_matrix\", \"rb\")\n",
    "prediction = np.array(pickle.load(file), dtype=float)\n",
    "user_num = pickle.load(file)\n",
    "item_num = pickle.load(file)\n",
    "file.close()\n",
    "\n",
    "# CVR = [0.1, 0.3, 0.5, 0.7, 0.9]\n",
    "# ratio = [0.53, 0.24, 0.14, 0.06, 0.03] (the same distribution as in Yahoo R3! MAR test set)\n",
    "total_num = prediction.shape[0]\n",
    "index = np.argsort(prediction)\n",
    "index_inverse = np.argsort(index)\n",
    "prediction = prediction[index]\n",
    "\n",
    "a = []\n",
    "a.append(prediction[int(total_num*0.53)])\n",
    "a.append(prediction[int(total_num*0.77)])\n",
    "a.append(prediction[int(total_num*0.91)])\n",
    "a.append(prediction[int(total_num*0.98)])\n",
    "\n",
    "prediction[:int(total_num*0.53)] = 1\n",
    "prediction[int(total_num*0.53):int(total_num*0.77)] = 2\n",
    "prediction[int(total_num*0.77):int(total_num*0.91)] = 3\n",
    "prediction[int(total_num*0.91):int(total_num*0.98)] = 4\n",
    "prediction[int(total_num*0.98):] = 5\n",
    "ground_truth = prediction[index_inverse]\n",
    "\n",
    "# Simulated prediction 1 - ONE\n",
    "n_1 = np.count_nonzero(np.where(ground_truth == 1))\n",
    "n_5 = np.count_nonzero(np.where(ground_truth == 5))\n",
    "select = np.random.choice(n_1, n_5, replace=False)\n",
    "prediction = ground_truth[index]\n",
    "prediction[select] = 5\n",
    "one = prediction[index_inverse]\n",
    "print(one[:50])\n",
    "# Simulated prediction 2 - Three\n",
    "n_3 = np.count_nonzero(np.where(ground_truth == 3))\n",
    "select = np.random.choice(n_3, n_5, replace=False)+int(total_num* 0.77)\n",
    "prediction = ground_truth[index]\n",
    "prediction[select] = 5\n",
    "three = prediction[index_inverse]\n",
    "\n",
    "# Simulated prediction 3 - Four\n",
    "n_4 = np.count_nonzero(np.where(ground_truth == 4))\n",
    "select = np.random.choice(n_4, n_5, replace=False)+int(total_num * 0.91)\n",
    "prediction = ground_truth[index]\n",
    "prediction[select] = 5\n",
    "four = prediction[index_inverse]\n",
    "\n",
    "# Rotate\n",
    "prediction = ground_truth[index]\n",
    "prediction[:int(total_num*0.53)] = 5\n",
    "prediction[int(total_num*0.53):int(total_num*0.77)] = 1\n",
    "prediction[int(total_num*0.77):int(total_num*0.91)] = 2\n",
    "prediction[int(total_num*0.91):int(total_num*0.98)] = 3\n",
    "prediction[int(total_num*0.98):] = 4\n",
    "rotate = prediction[index_inverse]\n",
    "\n",
    "# Simulated prediction 4 - SKEW\n",
    "prediction = np.copy(ground_truth)\n",
    "for i in range(prediction.shape[0]):\n",
    "    prediction[i] = np.random.normal(loc=prediction[i], scale=(6-prediction[i])/2, size=1)\n",
    "skew = np.clip(prediction, 1, 5)\n",
    "\n",
    "# Simulated prediction 5 - CRS\n",
    "prediction = np.copy(ground_truth)\n",
    "select1 = np.where(prediction >= 4)\n",
    "select2 = np.where(prediction < 4)\n",
    "prediction[select1] = 4\n",
    "prediction[select2] = 2\n",
    "crs = prediction\n",
    "print(crs[:20])\n",
    "print(ground_truth[:20])\n",
    "\n",
    "file = open(\"data/synthetic_data\", \"wb\")\n",
    "pickle.dump(ground_truth, file)\n",
    "pickle.dump(one, file)\n",
    "pickle.dump(three, file)\n",
    "pickle.dump(four, file)\n",
    "pickle.dump(rotate, file)\n",
    "pickle.dump(skew, file)\n",
    "pickle.dump(crs, file)\n",
    "pickle.dump(a, file)\n",
    "file.close()\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:root] *",
   "language": "python",
   "name": "conda-root-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
