{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "de626a7a-9492-4fe0-ad94-b525e91d1c84",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/usr/bin/sh: 1: poetry: not found\n"
     ]
    }
   ],
   "source": [
    "!poetry add jsonpickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "55662b9e-7139-4eec-8d7e-1289ea87f728",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Defaulting to user installation because normal site-packages is not writeable\n",
      "Requirement already satisfied: jsonpickle in /home/exp/.local/lib/python3.10/site-packages (3.0.2)\n",
      "Collecting dacite\n",
      "  Obtaining dependency information for dacite from https://files.pythonhosted.org/packages/21/0f/cf0943f4f55f0fbc7c6bd60caf1343061dff818b02af5a0d444e473bb78d/dacite-1.8.1-py3-none-any.whl.metadata\n",
      "  Downloading dacite-1.8.1-py3-none-any.whl.metadata (15 kB)\n",
      "Downloading dacite-1.8.1-py3-none-any.whl (14 kB)\n",
      "Installing collected packages: dacite\n",
      "Successfully installed dacite-1.8.1\n"
     ]
    }
   ],
   "source": [
    "!pip install jsonpickle dacite"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "173ae146-ad1b-44f3-8127-095c22d26817",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Defaulting to user installation because normal site-packages is not writeable\n",
      "Requirement already satisfied: numpy in /opt/conda/lib/python3.10/site-packages (1.26.1)\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "!{sys.executable} -m pip install numpy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "e5146f2f-bfec-47f3-a7eb-707ec930d26c",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/home/exp/src/experiments/model_training/notebooks\n"
     ]
    }
   ],
   "source": [
    "!pwd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "id": "0f121916-71d1-47f5-a73b-a94ff1517786",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "from dataclasses import dataclass\n",
    "\n",
    "import jsonpickle\n",
    "import jsonpickle.ext.pandas as jsonpickle_pandas\n",
    "import dacite\n",
    "import pandas as pd\n",
    "\n",
    "jsonpickle_pandas.register_handlers()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "id": "8b501e02-2889-43a6-8a18-833325c2b966",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# @jsonpickle.handlers.register(pd.DataFrame, base=True)\n",
    "class PandasHandler(jsonpickle.handlers.BaseHandler):\n",
    "    def flatten(self, df, ser):\n",
    "        path = \"/home/exp/src/experiments/model_training/notebooks/df.parquet\"\n",
    "        df.to_parquet(\n",
    "            path=path,\n",
    "        )\n",
    "        print(ser)\n",
    "        return {\n",
    "            \"py/object\": \"pandas.core.frame.DataFrame\",\n",
    "            \"stored_at\": path,\n",
    "        }\n",
    "        \n",
    "    def restore(self, ser):\n",
    "        path = ser[\"stored_at\"]\n",
    "        df = pd.read_parquet(path)\n",
    "        return df\n",
    "    \n",
    "jsonpickle.handlers.register(pd.DataFrame, PandasHandler, base=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "id": "e1494a55-659f-46ff-a5b3-056100cca5c1",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Data(a=5, b=['a', 'b'], c=   c1  c2\n",
       "0   1   4\n",
       "1   2   5\n",
       "2   3   6)"
      ]
     },
     "execution_count": 81,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "@dataclass\n",
    "class Data:\n",
    "    a: int\n",
    "    b: list[str]\n",
    "    c: pd.DataFrame\n",
    "    \n",
    "obj = Data(5, [\"a\", \"b\"], pd.DataFrame({\"c1\": [1, 2, 3], \"c2\": [4, 5, 6]}))\n",
    "obj"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "id": "6fa5d002-12d7-4d82-a358-a2b5457cb4f7",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{}\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "'{\"a\": 5, \"b\": [\"a\", \"b\"], \"c\": {\"py/object\": \"pandas.core.frame.DataFrame\", \"stored_at\": \"/home/exp/src/experiments/model_training/notebooks/df.parquet\"}}'"
      ]
     },
     "execution_count": 82,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "enc_obj = jsonpickle.encode(obj, unpicklable=False)\n",
    "enc_obj"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 75,
   "id": "443c8543-e627-4cb6-b219-b7c3bd1a075d",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'a': 5,\n",
       " 'b': ['a', 'b'],\n",
       " 'c':    c1  c2\n",
       " 0   1   4\n",
       " 1   2   5\n",
       " 2   3   6}"
      ]
     },
     "execution_count": 75,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "read_obj = jsonpickle.decode(enc_obj)\n",
    "read_obj"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "id": "50fc04f0-6f49-41b7-a9ce-152a21521fb7",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Data(a=5, b=['a', 'b'], c=   c1  c2\n",
       "0   1   4\n",
       "1   2   5\n",
       "2   3   6)"
      ]
     },
     "execution_count": 76,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dacite.from_dict(data_class=Data, data=read_obj)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e590f959-b70a-4469-863c-11ca272069be",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
