{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import nbformat\n",
    "from nbconvert.preprocessors import ExecutePreprocessor\n",
    "from nbconvert import NotebookExporter\n",
    "import os\n",
    "import csv\n",
    "os.environ['PYDEVD_DISABLE_FILE_VALIDATION'] = '1'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def data_generator(notebook_path, output_csv_path, executions):\n",
    "\n",
    "    exception_count = 0\n",
    "    num_correct = 0\n",
    "    iterations = 0\n",
    "\n",
    "    seen_questions = {}\n",
    "\n",
    "    with open(output_csv_path, 'w', newline='', encoding='utf-8') as csvfile:\n",
    "        writer = csv.writer(csvfile)\n",
    "        # Write header only once, at the beginning\n",
    "        writer.writerow([\"question\", \"solution\", \"question_type\", \"answer_type\",\\\n",
    "            \"extracted_answer\",\\\n",
    "            \"small_eval_point\", \"small_analytical\", \"small_numerical\",\\\n",
    "            \"large_eval_point\", \"large_analytical\", \"large_numerical\"])\n",
    "    \n",
    "    while num_correct < executions:\n",
    "        iterations += 1\n",
    "        try:\n",
    "            with open(notebook_path) as f:\n",
    "                nb = nbformat.read(f, as_version=4)\n",
    "                ep = ExecutePreprocessor(timeout=10, kernel_name='python3')\n",
    "                ep.preprocess(nb, {'metadata': {'path': os.path.dirname(notebook_path)}})\n",
    "\n",
    "                problem_cell = nb.cells[-3]\n",
    "                problem_output = problem_cell['outputs'][0]['text'] if problem_cell['outputs'] else \"No Problem Output\"\n",
    "\n",
    "                if problem_output in seen_questions:\n",
    "                    raise ValueError(\"Duplicate problem detected.\")\n",
    "                else:\n",
    "                    seen_questions[problem_output] = True\n",
    "                \n",
    "                solution_cell = nb.cells[-1]\n",
    "                solution_output = solution_cell['outputs'][0]['text'] if solution_cell['outputs'] else \"No Solution Output\"\n",
    "\n",
    "                problem_type = \"ODE\"\n",
    "\n",
    "                solution_type = \"list\"\n",
    "\n",
    "                small_x_eval_point_output = 0.1\n",
    "\n",
    "                both_solutions_cell = nb.cells[-5]\n",
    "                both_solutions_output = both_solutions_cell['outputs'][0]['text'] if both_solutions_cell['outputs'] else \"No Both Solutions\"\n",
    "\n",
    "                large_solution_cell = nb.cells[-7]\n",
    "                large_solution_output = large_solution_cell['outputs'][0]['text'] if large_solution_cell['outputs'] else \"No Small Solution\"\n",
    "                \n",
    "                small_solution_cell = nb.cells[-9]\n",
    "                small_solution_output = small_solution_cell['outputs'][0]['text'] if small_solution_cell['outputs'] else \"No Large Solution\"\n",
    "\n",
    "                small_x_approx_solution_cell = nb.cells[-17]\n",
    "                small_x_approx_solution_output = small_x_approx_solution_cell['outputs'][0]['text'] if small_x_approx_solution_cell['outputs'] else \"No small x approx Solution\"\n",
    "\n",
    "                large_x_approx_solution_cell = nb.cells[-15]\n",
    "                large_x_approx_solution_output = large_x_approx_solution_cell['outputs'][0]['text'] if large_x_approx_solution_cell['outputs'] else \"No Large x approx Solution\"\n",
    "\n",
    "                small_x_num_solution_cell = nb.cells[-13]\n",
    "                small_x_num_solution_output = small_x_num_solution_cell['outputs'][0]['text'] if small_x_num_solution_cell['outputs'] else \"No small x numerical Solution\"\n",
    "\n",
    "                large_x_num_solution_cell = nb.cells[-11]\n",
    "                large_x_num_solution_output = large_x_num_solution_cell['outputs'][0]['text'] if large_x_num_solution_cell['outputs'] else \"No Large x numerical Solution\"\n",
    "\n",
    "                large_x_eval_point_cell = nb.cells[-19]\n",
    "                large_x_eval_point_output = large_x_eval_point_cell['outputs'][0]['text'] if large_x_eval_point_cell['outputs'] else \"No large x eval point\"\n",
    "\n",
    "                # Writing/Appending to the CSV\n",
    "                with open(output_csv_path, 'a', newline='', encoding='utf-8') as csvfile:\n",
    "                    writer = csv.writer(csvfile)\n",
    "                    writer.writerow([problem_output, solution_output, problem_type, solution_type,\\\n",
    "                        both_solutions_output,\n",
    "                        small_x_eval_point_output, small_x_approx_solution_output, small_x_num_solution_output,\\\n",
    "                        large_x_eval_point_output, large_x_approx_solution_output, large_x_num_solution_output])\n",
    "\n",
    "            num_correct += 1\n",
    "            print(f\"num_correct: {num_correct}\")\n",
    "                                \n",
    "        except Exception as e:\n",
    "            exception_count += 1\n",
    "            print(f'Error during iteration {iterations}')\n",
    "            continue  # Skip the rest of this loop iteration and continue with the next\n",
    "\n",
    "        print(f'Execution {num_correct}/{iterations} completed and output appended to CSV.')\n",
    "        print(f'CSV file has been updated at: {os.path.abspath(output_csv_path)}')\n",
    "    print(f\"There were {num_correct}/{iterations} successes.\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "notebook_path = \"ODE_solver.ipynb\"\n",
    "output_csv_path = 'ODE_train_dataset.csv'\n",
    "data_generator(notebook_path, output_csv_path, 150)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "cs229_1",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
