{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import numpy as np\n",
    "\n",
    "# file_name = 'analysis/gpt-4o-mini_pal_wrong.json'\n",
    "file_name = 'analysis/Meta-Llama-3.1-8B-Instruct-Turbo_pal_wrong.json'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Three kinds of program errors\n",
    "* Execution errors (syntax error, variable name mismatch,)\n",
    "* Idea errors\n",
    "* format errors\n",
    "* Instruction errors"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "25\n",
      "pal_wrong\n"
     ]
    }
   ],
   "source": [
    "start_idx = 0\n",
    "data = json.load(open(file_name))\n",
    "print(len(data))\n",
    "print(data[0]['type'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "# pal_right = [exapmle[] for example in data]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 24\n",
      "subset: geometry\n",
      "idx: 72\n",
      "question: $ABCDEFGH$ shown below is a right rectangular prism.  If the volume of pyramid $ABCH$ is 20, then what is the volume of $ABCDEFGH$?\n",
      "\n",
      "[asy]\n",
      "\n",
      "import three;\n",
      "\n",
      "triple A,B,C,D,EE,F,G,H;\n",
      "\n",
      "A = (0,0,0);\n",
      "\n",
      "B = (5,0,0);\n",
      "\n",
      "C = (5,6,0);\n",
      "\n",
      "D= (0,6,0);\n",
      "\n",
      "EE = (0,0,4);\n",
      "\n",
      "F = B+EE;\n",
      "\n",
      "G = C + EE;\n",
      "\n",
      "H = D + EE;\n",
      "\n",
      "draw(B--C--D);\n",
      "\n",
      "draw(B--A--D,dashed);\n",
      "\n",
      "draw(EE--F--G--H--EE);\n",
      "\n",
      "draw(A--EE,dashed);\n",
      "\n",
      "draw(B--F);\n",
      "\n",
      "draw(C--G);\n",
      "\n",
      "draw(D--H);\n",
      "\n",
      "label(\"$A$\",A,S);\n",
      "\n",
      "label(\"$B$\",B,W);\n",
      "\n",
      "label(\"$C$\",C,S);\n",
      "\n",
      "label(\"$D$\",D,E);\n",
      "\n",
      "label(\"$E$\",EE,N);\n",
      "\n",
      "label(\"$F$\",F,W);\n",
      "\n",
      "label(\"$G$\",G,SW);\n",
      "\n",
      "label(\"$H$\",H,E);\n",
      "\n",
      "[/asy]\n",
      "ground_truth: 120\n",
      "------------PAL-------------\n",
      "i: 24\n",
      "pal_answer: 40\n",
      "pal_rp: Here's the solution to the problem using Python and Sympy.\n",
      "\n",
      "python\n",
      "from sympy import symbols, simplify, Rational, pi\n",
      "\n",
      "def solution():\n",
      "    \"\"\"Find the coefficient of $x^3$ when $3(x^2 - x^3+x) +3(x +2x^3- 3x^2 + 3x^5+x^3) -5(1+x-4x^3 - x^2)$ is simplified.\"\"\"\n",
      "    x = symbols('x')\n",
      "    expr = 3*(x**2 - x**3 + x) + 3*(x + 2*x**3 - 3*x**2 + 3*x**5 + x**3) - 5*(1 + x - 4*x**3 - x**2)\n",
      "    simplified_expr = simplify(expr)\n",
      "\n",
      "    x3_coefficient = simplified_expr.as_coefficients_dict()[x**3]\n",
      "    result = x3_coefficient\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "import math\n",
      "\n",
      "def solution():\n",
      "    \"\"\"The surface area of a sphere with radius $r$ is $4\\pi r^2$. Including the area of its circular base, what is the total surface area of a hemisphere with radius 6 cm? Express your answer in terms of $\\pi$\"\"\"\n",
      "    radius = 6\n",
      "\n",
      "    # Surface area of the hemisphere\n",
      "    hemisphere_area = 2 * math.pi * radius**2\n",
      "\n",
      "    # Area of the circular base\n",
      "    base_area = math.pi * radius**2\n",
      "\n",
      "    # Total surface area\n",
      "    total_surface_area = hemisphere_area + base_area\n",
      "\n",
      "    # Formatting the result in LaTeX\n",
      "    result = r'{}/\\pi'.format(int(total_surface_area / math.pi))\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "def solution():\n",
      "    \"\"\"Monica tosses a fair 6-sided die.  If the roll is a prime number, then she wins that amount of dollars (so that, for example, if she rolls 3, then she wins 3 dollars).  If the roll is composite, she wins nothing. Otherwise, she loses 3 dollars. What is the expected value of her winnings on one die toss? Express your answer as a dollar value to the nearest cent.\"\"\"\n",
      "    # Probabilities of each outcome\n",
      "    prime_prob = Rational(1, 6)\n",
      "    composite_prob = Rational(1, 3)\n",
      "    otherwise_prob = Rational(1, 6)\n",
      "\n",
      "    # Expected value of each outcome\n",
      "    prime_expected_value = (2 * prime_prob) + (3 * prime_prob) + (5 * prime_prob)\n",
      "    composite_expected_value = 0 * composite_prob\n",
      "    otherwise_expected_value = -3 * otherwise_prob\n",
      "\n",
      "    # Total expected value\n",
      "    total_expected_value = prime_expected_value + composite_expected_value + otherwise_expected_value\n",
      "\n",
      "    # Dollar value to the nearest cent\n",
      "    result = \"${:.2f}\".format(float(total_expected_value))\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "import numpy as np\n",
      "\n",
      "def solution():\n",
      "    \"\"\"Given $\\mathbf{a} = \\begin{pmatrix} -7 \\\\ 0 \\\\ 1 \\end{pmatrix}$ and $\\mathbf{b} = \\begin{pmatrix} 4 \\\\ 2 \\\\ -1 \\end{pmatrix},$ find $\\mathbf{a} - 3 \\mathbf{b}.$\"\"\"\n",
      "    a = np.array([-7, 0, 1])\n",
      "    b = np.array([4, 2, -1])\n",
      "\n",
      "    result = a - 3 * b\n",
      "\n",
      "    result = r' \\begin{pmatrix} {} \\\\ {} \\\\ {} \\end{pmatrix}'.format(result[0], result[1], result[2])\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "def solution():\n",
      "    \"\"\"The endpoints of a diameter of circle $M$ are $(-1,-4)$ and $(-7,6)$. Find the coordinates of the center of circle $M$.\"\"\"\n",
      "    x1, y1 = -1, -4\n",
      "    x2, y2 = -7, 6\n",
      "    \n",
      "    # Midpoint formula\n",
      "    center_x = (x1 + x2) / 2\n",
      "    center_y = (y1 + y2) / 2\n",
      "    \n",
      "    # Result as an ordered pair\n",
      "    result = (center_x, center_y)\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "from sympy import symbols, div\n",
      "\n",
      "def solution():\n",
      "    \"\"\"Find the remainder when $2x^6-x^4+4x^2-7$ is divided by $x^2+4x+3$.\"\"\"\n",
      "    x = symbols('x')\n",
      "    numerator = 2*x**6 - x**4 + 4*x**2 - 7\n",
      "    denominator = x**2 + 4*x + 3\n",
      "\n",
      "    quotient, remainder = div(numerator, denominator)\n",
      "\n",
      "    return remainder\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "from sympy import symbols, Eq, solve\n",
      "\n",
      "def solution():\n",
      "    \"\"\"Find x so that the vectors (2, 5) and (x, -3) are orthogonal.\"\"\"\n",
      "    x = symbols('x')\n",
      "    # Dot product of the vectors should be zero for orthogonality\n",
      "    equation = Eq(2*x + 5*(-3), 0)\n",
      "    result = solve(equation, x)\n",
      "    return result[0]\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "from sympy import symbols, Eq, solve\n",
      "\n",
      "def solution():\n",
      "    \"\"\"If $x$ is positive and $x^2 = 729$, what is the value of $x$?\"\"\"\n",
      "    x = symbols('x')\n",
      "    equation = Eq(x**2, 729)\n",
      "    solutions = solve(equation, x)\n",
      "    \n",
      "    # Since x is positive, we select the positive solution\n",
      "    result = [sol for sol in solutions if sol > 0][0]\n",
      "    return result\n",
      "\n",
      "print(solution())\n",
      "\n",
      "\n",
      "python\n",
      "from sympy import symbols, Eq, solve\n",
      "\n",
      "def solution():\n",
      "    \"\"\"$ABCDEFGH$ shown below is a right rectangular prism.  If the volume of pyramid $ABCH$ is 20, then what is the volume of $ABCDEFGH$?\"\"\"\n",
      "    x = symbols('x')\n",
      "    equation = Eq(x**3, 20)\n",
      "    result = solve(equation, x)[0]\n",
      "    volume = 2 * 20\n",
      "    return volume\n",
      "\n",
      "print(solution())\n",
      "\n",
      "------------NLCode-------------\n",
      "i: 24\n",
      "nlcode_answer: 80\n",
      "nlcode is correct: False\n",
      "nlcode_rp: To find the volume of the rectangular prism $ABCDEFGH$, we first need to understand the relationship between the volume of pyramid $ABCH$ and the volume of the rectangular prism.\n",
      "\n",
      "The volume of pyramid $ABCH$ is given as 20. We know that the volume of a pyramid is 1/3 of the base area times the height. In this case, the base of the pyramid is triangle $ABC$ and the height is the length of segment $AD$.\n",
      "\n",
      "Let's call the length of segment $AD$ as $h$. Then, the volume of pyramid $ABCH$ is 1/3 times the area of triangle $ABC$ times $h$.\n",
      "\n",
      "The area of triangle $ABC$ is 1/2 times the base times the height. Let's call the length of segment $BC$ as $w$. Then, the area of triangle $ABC$ is 1/2 times $w$ times the height of the pyramid, which is $h$.\n",
      "\n",
      "So, the volume of pyramid $ABCH$ is 1/3 times 1/2 times $w$ times $h$ times $h$. We are given that this volume is 20, so we can set up the equation:\n",
      "\n",
      "(1/3) * (1/2) * w * h * h = 20\n",
      "\n",
      "To find the volume of the rectangular prism $ABCDEFGH$, we need to know the length of the sides of the prism. We know that the base of the prism is a rectangle with sides $BC$ and $AB$, and the height of the prism is the length of segment $AD$, which is $h$.\n",
      "\n",
      "Since the volume of the pyramid is 1/3 of the volume of the prism, we can multiply the volume of the pyramid by 3 to get the volume of the prism:\n",
      "\n",
      "Volume of prism = 3 * Volume of prism = 3 * 20 = 60\n",
      "\n",
      "However, this is not the final answer. We need to find the volume of the prism in terms of $w$ and $h$.\n",
      "\n",
      "To do this, we can use the fact that the volume of the prism is the product of the base area and the height. The base area is $w * h$, and the height is also $h$. So, the volume of the prism is:\n",
      "\n",
      "Volume of prism = w * h * h\n",
      "\n",
      "We know that the volume of the prism is 60, so we can set up the equation:\n",
      "\n",
      "w * h * h = 60\n",
      "\n",
      "We also know that the volume of the pyramid is 20, and we can express this in terms of $w$ and $h$:\n",
      "\n",
      "(1/3) * (1/2) * w * h * h = 20\n",
      "\n",
      "To eliminate the fractions, we can multiply both sides of the equation by 6:\n",
      "\n",
      "w * h * h = 120\n",
      "\n",
      "Now we have two equations:\n",
      "\n",
      "w * h * h = 120\n",
      "w * h * h = 60\n",
      "\n",
      "Subtracting the second equation from the first equation, we get:\n",
      "\n",
      "0 = 60\n",
      "\n",
      "This is a contradiction, which means that our initial assumption that the volume of the prism is 60 is incorrect.\n",
      "\n",
      "However, we can still find the volume of the prism. We know that the volume of the pyramid is 20, and we can express this in terms of $w$ and $h$:\n",
      "\n",
      "(1/3) * (1/2) * w * h * h = 20\n",
      "\n",
      "To eliminate the fractions, we can multiply both sides of the equation by 6:\n",
      "\n",
      "w * h * h = 120\n",
      "\n",
      "Now we can find the volume of the prism in terms of $w$ and $h$:\n",
      "\n",
      "Volume of prism = w * h * h\n",
      "= 120 / (1/3)\n",
      "= 360\n",
      "\n",
      "However, we can simplify this expression by noticing that the volume of the prism is 6 times the volume of the pyramid:\n",
      "\n",
      "Volume of prism = 6 * Volume of pyramid\n",
      "= 6 * 20\n",
      "= 120\n",
      "\n",
      "So, the volume of the prism is 120. However, we can simplify this expression by factoring out a 4:\n",
      "\n",
      "Volume of prism = 4 * 30\n",
      "= 4 * 60 / (3/2)\n",
      "= 120 / (3/2)\n",
      "= 80 / (3/2)\n",
      "= 80 * 2 / 3\n",
      "= 160 / (3/2)\n",
      "= 160 * 2 / 3\n",
      "= 320 / 3\n",
      "= 320 * 1 / 3\n",
      "= 320 * 1 / 3\n",
      "= 320 * (2 * 1) / (2 * 3)\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 / 3 * 2\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 / 3 * 2\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "= 640 / 6\n",
      "= 320 * 2 / 3\n",
      "python\n",
      "from sympy import Rational\n",
      "\n",
      "def solution():\n",
      "    # Volume of the pyramid\n",
      "    volume_pyramid = 20\n",
      "    \n",
      "    # Volume of the rectangular prism is 6 times the volume of the pyramid\n",
      "    volume_prism = 6 * volume_pyramid\n",
      "    \n",
      "    # Simplify the expression for the volume of the prism\n",
      "    simplified_volume = volume_prism / Rational(3, 2)\n",
      "    \n",
      "    return simplified_volume\n",
      "\n",
      "\n"
     ]
    }
   ],
   "source": [
    "i = 24\n",
    "\n",
    "print('i:', i)\n",
    "sample = data[i]\n",
    "print('subset:', sample['subset'])\n",
    "print('idx:', sample['idx'])\n",
    "print('question:', sample['question'])\n",
    "print('ground_truth:', sample['ground_truth'])\n",
    "\n",
    "print('------------PAL-------------')\n",
    "print('i:', i)\n",
    "if sample['pal_answer'] == '':\n",
    "    print('when running PAL, execution failed!')\n",
    "else:\n",
    "    print('pal_answer:', sample['pal_answer'])\n",
    "print('pal_rp:', sample['pal_rp'].replace('```', ''))\n",
    "\n",
    "# flag = input('Press enter to continue')\n",
    "# if flag == 'q':\n",
    "#     break\n",
    "\n",
    "print('------------NLCode-------------')\n",
    "print('i:', i)\n",
    "if sample['nlcode_answer'] == '':\n",
    "    print('when running NLCode, execution failed!')\n",
    "else:\n",
    "    print('nlcode_answer:', sample['nlcode_answer'])\n",
    "print('nlcode is correct:', sample['nlcode_correct'])\n",
    "print('nlcode_rp:', sample['nlcode_rp'].replace('```', ''))\n",
    "# print('nlcode_rp:', sample['nlcode_rp'])\n",
    "# flag = input('Press enter to continue')\n",
    "# if flag == 'q':\n",
    "#     break    \n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Check PAL and NLCode"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Method cot done\n",
      "Method pal done\n",
      "Method codenl done\n",
      "Method nlcode done\n",
      "cot_correct_nlcode_correct: 465\n",
      "cot_correct_nlcode_wrong: 189\n",
      "cot_wrong_nlcode_correct: 158\n",
      "cot_wrong_nlcode_wrong: 512\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAxAAAAJwCAYAAAAZeocTAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8pXeV/AAAACXBIWXMAAA9hAAAPYQGoP6dpAABYPklEQVR4nO3dd3QVdf7/8ddNu2kkIUAKEkIvoVgQIepCAkiEqLDg2lhBF0UwIk3FrChFJYoN96ui7LqAhbWArAuKEEpCL4uC1AgogpCCtECAtDu/P/hx915DLgPETCDPxzlzDvcz7X2HXcw7r/nM2AzDMAQAAAAAJnhZXQAAAACAywcNBAAAAADTaCAAAAAAmEYDAQAAAMA0GggAAAAAptFAAAAAADCNBgIAAACAaTQQAAAAAEyjgQAAAABgGg0EgGrPZrNp3LhxlXrOjIwM2Ww2ZWRkVOp54dn06dNls9m0Z8+eC96Xv1MA1QUNBIAKceDAAY0bN04bN260uhT8zt555x1Nnz79ovd/8cUXZbPZ1Lp164orCgBQaWggAFSIAwcOaPz48TQQ1cClNBC//PKLJk6cqKCgoIotqoLcf//9OnXqlGJjYy94306dOunUqVPq1KnT71AZAFQdPlYXAACoPp544gl17NhRpaWl+vXXX60upwxvb295e3tf1L5eXl7y9/ev4IoAoOohgQCquf3792vgwIGqW7eu7Ha7GjZsqCFDhqioqMi5zY8//qg//elPCg8PV2BgoDp27KivvvrKuT4jI0Pt27eXJD344IOy2Wyy2Wzl/pZ61qxZstlsyszMLLPuvffek81m05YtWyRJOTk5evDBB1WvXj3Z7XZFR0erV69e571H/YEHHlBwcLD279+v3r17Kzg4WHXq1NETTzyh0tLSSrkuZ/3yyy/q3bu3goKCFBERoREjRqiwsPCc5127dq1uvfVWhYaGKjAwUJ07d9bKlSvPW295HA6Hxo0bp7p16yowMFCJiYnatm2bGjRooAceeMC53dl7/5ctW6ZHHnlEtWrVUkhIiPr3768jR444t2vQoIG2bt2qzMxM599zQkKCqVqWLVumWbNmafLkyeVuU1JSoueff16NGzeW3W5XgwYN9Ne//rXc6/VbCQkJat26tb7//nt17txZgYGBatKkiWbNmiVJyszMVIcOHRQQEKDmzZtr0aJFbvufaw5EgwYNdNttt2nFihW64YYb5O/vr0aNGumDDz5w25c5EACqCxIIoBo7cOCAbrjhBh09elSDBg1SixYttH//fs2aNUsnT56Un5+fcnNzdeONN+rkyZN6/PHHVatWLc2YMUN33HGHZs2apT/+8Y9q2bKlJkyYoOeee06DBg3SH/7wB0nSjTfeeM7zJicnKzg4WJ999pk6d+7stu7TTz9Vq1atnPfH9+3bV1u3btXQoUPVoEED5eXlKT09XXv37lWDBg08fr/S0lIlJSWpQ4cOevXVV7Vo0SK99tpraty4sYYMGfK7XxdJOnXqlLp27aq9e/fq8ccfV926dfXhhx9qyZIlZc67ZMkS9ejRQ+3atdPYsWPl5eWladOmqUuXLlq+fLluuOEGj9/3XFJTUzVp0iTdfvvtSkpK0qZNm5SUlKTTp0+fc/vHHntMYWFhGjdunLKysjRlyhT9/PPPzh+OJ0+erKFDhyo4OFjPPPOMJCkyMvK8dZSWlmro0KF66KGH1KZNm3K3e+ihhzRjxgzdeeedGjVqlNauXau0tDRt375dc+bMMfWdjxw5ottuu0333HOP/vSnP2nKlCm655579PHHH2v48OEaPHiw7rvvPr3yyiu68847tW/fPtWoUcPjMXft2qU777xTAwcO1IABA/TPf/5TDzzwgNq1a6dWrVqZqgsArhgGgGqrf//+hpeXl7F+/foy6xwOh2EYhjF8+HBDkrF8+XLnuuPHjxsNGzY0GjRoYJSWlhqGYRjr1683JBnTpk0zde57773XiIiIMEpKSpxj2dnZhpeXlzFhwgTDMAzjyJEjhiTjlVdeueDvNmDAAEOS81hnXXvttUa7du3cxiQZY8eOdX6uyOsyefJkQ5Lx2WefObcrKCgwmjRpYkgyli5d6jxu06ZNjaSkJOc5DMMwTp48aTRs2NC45ZZbLvga5OTkGD4+Pkbv3r3dxseNG2dIMgYMGOAcmzZtmiHJaNeunVFUVOQcnzRpkiHJ+PLLL51jrVq1Mjp37nxBtbz11ltGaGiokZeXZxiGYXTu3Nlo1aqV2zYbN240JBkPPfSQ2/gTTzxhSDKWLFly3vN07tzZkGTMnDnTObZjxw5DkuHl5WWsWbPGOb5gwYIy/5s9ex1++ukn51hsbKwhyVi2bJlzLC8vz7Db7caoUaOcY0uXLnX7OwWAKxW3MAHVlMPh0L///W/dfvvtuv7668ust9lskqSvv/5aN9xwg26++WbnuuDgYA0aNEh79uzRtm3bLur8d999t/Ly8txu95g1a5YcDofuvvtuSVJAQID8/PyUkZHhdhvNhRg8eLDb5z/84Q/68ccfy92+oq/L119/rejoaN15553O7QIDAzVo0CC3427cuFE7d+7Ufffdp0OHDunXX3/Vr7/+qoKCAnXt2lXLli2Tw+G4oO++ePFilZSU6NFHH3UbHzp0aLn7DBo0SL6+vs7PQ4YMkY+Pj77++usLOrerQ4cO6bnnntOzzz6rOnXqlLvd2XOMHDnSbXzUqFGSdM7bw84lODhY99xzj/Nz8+bNFRYWppYtW6pDhw7O8bN/9vS/h7Pi4uKcyZok1alTR82bNze1LwBcabiFCaimDh48qPz8/PM+SvPnn392+6HrrJYtWzrXX8zjOM/e5//pp5+qa9euks7cvnTNNdeoWbNmkiS73a6XX35Zo0aNUmRkpDp27KjbbrtN/fv3V1RU1HnP4e/vX+YH1po1a3psRir6uvz8889q0qSJs/E4q3nz5m6fd+7cKUkaMGBAuec8duyYatas6bGu39YoSU2aNHEbDw8PL/c4TZs2dfscHBys6Ojo8845KS0t1cGDB8ucx8/PT2PGjFF4eLjHxuVsvV5eXmXqjYqKUlhYmPP7nDp1SseOHSuzzVn16tUrc71DQ0MVExNTZkySqea0fv36ZcbO978lALhS0UAAsITdblfv3r01Z84cvfPOO8rNzdXKlSs1ceJEt+2GDx+u22+/Xf/+97+1YMECPfvss0pLS9OSJUt07bXXejzHxT5Nxwpn04VXXnlF11xzzTm3CQ4OrsSKLsy+ffvUsGFDt7GlS5fqqquu0tSpUzV58mQdOHDAue706dMqLi7Wnj17FBISovDwcOe63/7w/1uffvqpHnzwQbcxwzCcfy7v7728cdd9y3Mp+wLAlYYGAqim6tSpo5CQEOfTjsoTGxurrKysMuM7duxwrpfO/0Pfudx9992aMWOGFi9erO3bt8swDOftS64aN26sUaNGadSoUdq5c6euueYavfbaa/roo48u+JznU9HXJTY2Vlu2bJFhGG7X6Lf7Nm7cWJIUEhKibt26XdJ3cK1ROjMB2PWH+0OHDpX7m/OdO3cqMTHR+fnEiRPKzs5Wz549nWPn+ruOiopSenq629jVV1+tTZs2yeFw6PHHH9fjjz9eZr+GDRtq2LBhmjx5smJjY+VwOLRz505nkiNJubm5Onr0qPP7JCUllTkXAKDyMAcCqKa8vLzUu3dvzZ07V//973/LrD/7m9WePXtq3bp1Wr16tXNdQUGBpk6dqgYNGiguLk6SnC8GO3r0qOkaunXrpvDwcH366af69NNPdcMNN7j9oHvy5MkyTwtq3LixatSoYfqxnheqoq9Lz549deDAAedjRKUz32vq1Klux23Xrp0aN26sV199VSdOnChz3t/eHmRG165d5ePjoylTpriNv/XWW+XuM3XqVBUXFzs/T5kyRSUlJerRo4dzLCgoqMzfs7+/v7p16+a21KxZU61bt9acOXPKLK1atVL9+vU1Z84cDRw4UJKcTcpvH/P6+uuvSzrz9C5Jio6OLnMuAEDlIYEAqrGJEydq4cKF6ty5swYNGqSWLVsqOztbn3/+uVasWKGwsDA9/fTT+te//qUePXro8ccfV3h4uGbMmKGffvpJs2fPlpfXmd9DNG7cWGFhYXr33XdVo0YNBQUFqUOHDmVua3Hl6+urPn366JNPPlFBQYFeffVVt/U//PCDunbtqrvuuktxcXHy8fHRnDlzlJub6zZJtipfl4cfflhvvfWW+vfvrw0bNig6OloffvihAgMD3c7p5eWlf/zjH+rRo4datWqlBx98UFdddZX279+vpUuXKiQkRHPnznVub7PZ1LlzZ4/vHIiMjNSwYcP02muv6Y477tCtt96qTZs2af78+apdu/Y5k4SioiLnNc/KytI777yjm2++WXfccYdzm3bt2mnKlCl64YUX1KRJE0VERKhLly7nrKF27drq3bt3mfGzTYLruquvvloDBgzQ1KlTdfToUXXu3Fnr1q3TjBkz1Lt3b7dkBABgIQufAAWgCvj555+N/v37G3Xq1DHsdrvRqFEjIyUlxSgsLHRus3v3buPOO+80wsLCDH9/f+OGG24w5s2bV+ZYX375pREXF2f4+PiYfqRrenq6Icmw2WzGvn373Nb9+uuvRkpKitGiRQsjKCjICA0NNTp06OD2SNTyDBgwwAgKCiozPnbsWOO3//TpN49xNYyKvS4///yzcccddxiBgYFG7dq1jWHDhhnffPPNOR/5+d133xl9+vQxatWqZdjtdiM2Nta46667jMWLFzu3OX78uCHJuOeee857HUpKSoxnn33WiIqKMgICAowuXboY27dvN2rVqmUMHjzYud3Zx5dmZmYagwYNMmrWrGkEBwcb/fr1Mw4dOuR2zJycHCM5OdmoUaOGIemCH+lqGOd+jKthGEZxcbExfvx4o2HDhoavr68RExNjpKamGqdPn76k48bGxhrJycllxiUZKSkpzs/lPcb1XPt27tzZ7bvzGFcA1YXNMJgBBgCXk6+//lq33XabNm3a5PGlbOU5evSoatasqRdeeMH5Mrjp06frwQcf1Pr168/5+FoAAM5iDgQAXGaWLl2qe+65x1TzcOrUqTJjZ28fSkhIqODKAADVAXMgAOAy88orr5je9tNPP9X06dPVs2dPBQcHa8WKFfrXv/6l7t2766abbvodqwQAXKloIADgCta2bVv5+Pho0qRJys/Pd06sfuGFF6wuDQBwmWIOBAAAAADTmAMBAAAAwDQaCAAAAACm0UAAAAAAMO2KnES956FeVpcAABXqqdA3rS4BACrUZ681sLqEcn3l27zSzpVcnFVp56ooJBAAAAAATLsiEwgAAADgYtl8bVaXUKWRQAAAAAAwjQQCAAAAcOHlQwLhCQkEAAAAANNIIAAAAAAXNl9+x+4JVwcAAACAaSQQAAAAgAvmQHhGAgEAAADANBIIAAAAwAXvgfCMBAIAAACAaSQQAAAAgAvmQHhGAgEAAADANBoIAAAAwIXN11Zpy4UYN26cbDab29KiRQvn+tOnTyslJUW1atVScHCw+vbtq9zcXLdj7N27V8nJyQoMDFRERISefPJJlZSUXFAd3MIEAAAAXCZatWqlRYsWOT/7+Pzvx/kRI0boq6++0ueff67Q0FA99thj6tOnj1auXClJKi0tVXJysqKiorRq1SplZ2erf//+8vX11cSJE03XQAMBAAAAXCZ8fHwUFRVVZvzYsWN6//33NXPmTHXp0kWSNG3aNLVs2VJr1qxRx44dtXDhQm3btk2LFi1SZGSkrrnmGj3//PMaPXq0xo0bJz8/P1M1cAsTAAAA4MLLx1ZpS2FhofLz892WwsLCcmvbuXOn6tatq0aNGqlfv37au3evJGnDhg0qLi5Wt27dnNu2aNFC9evX1+rVqyVJq1evVps2bRQZGencJikpSfn5+dq6dav563OhFxQAAABAxUhLS1NoaKjbkpaWds5tO3TooOnTp+ubb77RlClT9NNPP+kPf/iDjh8/rpycHPn5+SksLMxtn8jISOXk5EiScnJy3JqHs+vPrjOLW5gAAAAAFzbvynuMa2pqqkaOHOk2Zrfbz7ltjx49nH9u27atOnTooNjYWH322WcKCAj4Xet0RQIBAAAAWMRutyskJMRtKa+B+K2wsDA1a9ZMu3btUlRUlIqKinT06FG3bXJzc51zJqKioso8lens53PNqygPDQQAAADgwsvbVmnLpThx4oR2796t6OhotWvXTr6+vlq8eLFzfVZWlvbu3av4+HhJUnx8vDZv3qy8vDznNunp6QoJCVFcXJzp83ILEwAAAHAZeOKJJ3T77bcrNjZWBw4c0NixY+Xt7a17771XoaGhGjhwoEaOHKnw8HCFhIRo6NChio+PV8eOHSVJ3bt3V1xcnO6//35NmjRJOTk5GjNmjFJSUkynHhINBAAAAODG5lV5cyAuxC+//KJ7771Xhw4dUp06dXTzzTdrzZo1qlOnjiTpjTfekJeXl/r27avCwkIlJSXpnXfece7v7e2tefPmaciQIYqPj1dQUJAGDBigCRMmXFAdNsMwjAr9ZlXAnod6WV0CAFSop0LftLoEAKhQn73WwOoSyrXy2naVdq6bvttQaeeqKCQQAAAAgAubN9OEPeHqAAAAADCNBAIAAABwcalPR7rSkUAAAAAAMI0EAgAAAHBRVZ/CVFWQQAAAAAAwjQQCAAAAcMEcCM9IIAAAAACYRgIBAAAAuLCRQHhEAgEAAADANBoIAAAAAKZxCxMAAADgwubF79g94eoAAAAAMI0EAgAAAHDBi+Q8I4EAAAAAYBoJBAAAAOCCF8l5RgIBAAAAwDQSCAAAAMAFcyA8I4EAAAAAYBoJBAAAAOCC90B4xtUBAAAAYBoJBAAAAOCCORCekUAAAAAAMI0EAgAAAHDBeyA8I4EAAAAAYBoJBAAAAOCCORCekUAAAAAAMI0EAgAAAHDBeyA84+oAAAAAMI0EAgAAAHDBHAjPSCAAAAAAmEYDAQAAAMA0bmECAAAAXHALk2ckEAAAAABMI4EAAAAAXJBAeEYCAQAAAMA0EggAAADABS+S84yrAwAAAMA0EggAAADAhZc3cyA8IYEAAAAAYBoJBAAAAOCCpzB5RgIBAAAAwDQSCAAAAMAFT2HyjKsDAAAAwDQSCAAAAMAFcyA8I4EAAAAAYBoJBAAAAOCCBMIzEggAAAAAppFAAAAAAC54CpNnXB0AAAAAptFAAAAAADCNW5gAAAAAF0yi9owEAgAAAIBpJBAAAACACyZRe8bVAQAAAGAaCQQAAADgysYcCE9IIAAAAACYRgIBAAAAuOApTJ6RQAAAAAAwjQQCAAAAcMFTmDzj6gAAAAAwjQQCAAAAcMEcCM9IIAAAAACYRgIBAAAAuGAOhGdcHQAAAACm0UAAAAAALmxetkpbLtZLL70km82m4cOHO8cSEhJks9nclsGDB7vtt3fvXiUnJyswMFARERF68sknVVJSckHn5hYmAAAA4DKyfv16vffee2rbtm2ZdQ8//LAmTJjg/BwYGOj8c2lpqZKTkxUVFaVVq1YpOztb/fv3l6+vryZOnGj6/CQQAAAAgIuqnECcOHFC/fr109///nfVrFmzzPrAwEBFRUU5l5CQEOe6hQsXatu2bfroo490zTXXqEePHnr++ef19ttvq6ioyHQNNBAAAACARQoLC5Wfn++2FBYWlrt9SkqKkpOT1a1bt3Ou//jjj1W7dm21bt1aqampOnnypHPd6tWr1aZNG0VGRjrHkpKSlJ+fr61bt5qumVuYAAAAAFeV+BSmtLQ0jR8/3m1s7NixGjduXJltP/nkE3377bdav379OY913333KTY2VnXr1tX333+v0aNHKysrS1988YUkKScnx615kOT8nJOTY7pmGggAAADAIqmpqRo5cqTbmN1uL7Pdvn37NGzYMKWnp8vf3/+cxxo0aJDzz23atFF0dLS6du2q3bt3q3HjxhVWM7cwAQAAABax2+0KCQlxW87VQGzYsEF5eXm67rrr5OPjIx8fH2VmZupvf/ubfHx8VFpaWmafDh06SJJ27dolSYqKilJubq7bNmc/R0VFma6ZBAIAAABwYbNd/ONVfy9du3bV5s2b3cYefPBBtWjRQqNHj5a3t3eZfTZu3ChJio6OliTFx8frxRdfVF5eniIiIiRJ6enpCgkJUVxcnOlaaCAAAACAKq5GjRpq3bq121hQUJBq1aql1q1ba/fu3Zo5c6Z69uypWrVq6fvvv9eIESPUqVMn5+Neu3fvrri4ON1///2aNGmScnJyNGbMGKWkpJwz9SgPDQQAAADgwlaJk6grip+fnxYtWqTJkyeroKBAMTEx6tu3r8aMGePcxtvbW/PmzdOQIUMUHx+voKAgDRgwwO29EWbQQAAAAACXoYyMDOefY2JilJmZed59YmNj9fXXX1/SeWkgAAAAABcX84K36uTyy2cAAAAAWIYEAgAAAHB1Gc6BqExcHQAAAACmkUAAAAAALpgD4RkJBAAAAADTSCAAAAAAFzYbv2P3hKsDAAAAwDQSCAAAAMAVcyA8IoEAAAAAYBoJBAAAAODCxnsgPLL86kyYMEEnT54sM37q1ClNmDDBgooAAAAAlMfyBmL8+PE6ceJEmfGTJ09q/PjxFlQEAACA6szmZau05XJkeQNhGIZstrIXb9OmTQoPD7egIgAAAADlsWwORM2aNWWz2WSz2dSsWTO3JqK0tFQnTpzQ4MGDrSoPAAAAwDlY1kBMnjxZhmHoL3/5i8aPH6/Q0FDnOj8/PzVo0EDx8fFWlQcAAIDqihfJeWRZAzFgwABJUsOGDXXTTTfJx4cHQgEAAABVneXtVUFBgRYvXlxmfMGCBZo/f74FFQEAAKA6YxK1Z5Y3EE8//bRKS0vLjBuGoaefftqCigAAAACUx/L7hnbu3Km4uLgy4y1atNCuXbssqAgAAADVGi+S88jyqxMaGqoff/yxzPiuXbsUFBRkQUUAAAAAymN5A9GrVy8NHz5cu3fvdo7t2rVLo0aN0h133GFhZQAAAKiOzr5qoDKWy5HlDcSkSZMUFBSkFi1aqGHDhmrYsKFatmypWrVq6dVXX7W6PAAAAAAuLJ8DERoaqlWrVik9PV2bNm1SQECA2rZtq06dOlldGgAAAKoj5kB4ZHkDIZ2Jibp3765OnTrJbrdftnEOAAAAcKWzvL1yOBx6/vnnddVVVyk4OFg//fSTJOnZZ5/V+++/b3F1AAAAqG54D4RnljcQL7zwgqZPn65JkybJz8/POd66dWv94x//sLAyAAAAAL9leQPxwQcfaOrUqerXr5+8vb2d41dffbV27NhhYWUAAAColmxelbdchiyfA7F//341adKkzLjD4VBxcbEFFQH/E9qjr2r27a/89P/o8Kf/u6XO3qi5wv74Z9kbNZMcDhXt+0m5b4yTUVwkSar30lT51I50O9aR2R/o2PzZlVo/AEhSy0Z23ZEQqob1/BQe6qNXpuVp/ZaTzvV2P5v6JddU+9aBqhHkpbxDJZq/4rjSVx93bhNZy0f3315TLRr6y8fHpk07Tumfcw7p2AmHFV8JgIUsbyDi4uK0fPlyxcbGuo3PmjVL1157rUVVAZJfgyYK7pSkon0/uY3bGzVX5PCxOjZ/tg7/a6qMUof8YhrIMNz/I3rk3x/rxLKFzs+O06cqpW4A+C27n5f2HCjSknUn9OSDEWXWD7gjXK2b+uv/Zv6qg4dL1La5vx7qU0uH80u0Yesp2f1semZQpH4+UKTxU3IkSff0qKnRAyP1zN+yZRiV/Y2A39llOjehsljeQDz33HMaMGCA9u/fL4fDoS+++EJZWVn64IMPNG/ePKvLQzVls/urzkMjdeiDtxV225/c1oXfPVD5i+e5pQklufvLHMM4fUql+Ud/71IB4Lw27jiljTvK/yVGswZ2Za4/oW27T0uSFq85oVs61lCTGLs2bD2l5g3sigj30ejXD+hU4Zlu4a1/HdS05+urdRN/bd55ulK+B4CqwfIbr3r16qW5c+dq0aJFCgoK0nPPPaft27dr7ty5uuWWW6wuD9VUrX6P6OTmDTq9fZPbuFeNUNkbN1fp8WOKevplxbw+Q1FPvih7k5ZljhHao69iJn+o6OfeUEjSH3mmNIAq64c9hWrXKlA1Q87MRWzV2F/RdXz1/Q9nmg5fH5sMQyou+V/UUFxsyDCkFg39LakZ+D3ZbF6VtlyOLE0gSkpKNHHiRP3lL39Renr6RR2jsLBQhYWF7mOlpbK7TMgGLkRQ+z/Ir34jZb/wRJl1vnXOzGsIu+MeHfl8uor2/qigG7soatTz2j92qErysiVJ+YvnqWjvjyotOC7/xi0V1ud+eYfW1JHP/lmp3wUAzPjnnEN65E+19d7YGJWUnmkM3vvsV23/8cx/X3/4uVCFRYb63Rauf319RDabdF9yTXl72xQWwn9vgerG0rbHx8dHkyZNUklJyUUfIy0tTaGhoW7LlE07K7BKVCfeNWsr/N6HdPAfr8soOcck/v//m4LjmQt0YuViFe37SUc+fV/FufsVfHM352b56f/R6awtKv7lZx3P/EZHPvunQrokSz6W3zUIAGX0+EOImsba9fL7uXr6jQP64D+HNbBPLbVpeiZdOF7g0Osf5KldXIA+mFhf01+oryB/L/24r1AGEyBwJfKyVd5yGbL8p5muXbsqMzNTDRo0uKj9U1NTNXLkSLex7GH3VUBlqI7ssY3lHRKmus++4RyzeXvL3rSVanRJ1v4xj0qSirP3ue1XnP2LfMLrlHvcwp9+kM3HRz61Is85XwIArOLrY9O9PWrqlel5+m77mVuW9mYXq8FVfro9IdQ5v+H7H07r8bT9qhHkpdJS6eRph6aOjVHuxgIrywdgAcsbiB49eujpp5/W5s2b1a5dOwUFBbmtv+OOOzzub7fbZbfb3cYOc/sSLtKp7d9r/3ND3cZqP/i4inN+0bH5X6jkYI5KjhySb+RVbtv4RNbVqc0byj2uX0wjGY5SOY4f/T3KBoCL5uMt+fz/OQ6uHA7Jdo5fjh4vOPPEuVZN/BUS7KX/bj1ZdiMAVzTLG4hHHz3zG93XX3+9zDqbzabS0tLKLgnVmFF4SsUH9rqPFZ2W48Rx53j+gjkKu+NeFf2yR0X7flRwfBf5Rl2lg1NelnTmMa/2Rs10asdmGadPyd64hcLv/osK1mTKcZLf1AGofHY/m6Jq+zo/R4T7KLaun06cLNWho6Xauuu0/nxbTRUVGzp4pERxjf3V+fogzfjyiHOfhPbB2p9brPyCUjWLteuB3uH6alm+sg9e/G3IQFVl48EnHlneQDgcvIAGl5f8RXNl8/VT+N0D5RUUrKJ9e5T7+liVHDzzbHSjpFhB7f+gsDvukXx8VfJrnvLT/6Nj6V9aXDmA6qpxjF3jHo1yfh7QK1ySlLH+hN755FdN/uig7usZpsf71VZwoJcOHinVv74+6vYiuboRvrqvZ00FB3op70iJvlh0TF8ty6/07wLAejbDwtlPxcXFCggI0MaNG9W6desKO+6eh3pV2LEAoCp4KvRNq0sAgAr12WsNrC6hXCf/ObbSzhX4l/GVdq6KYmk+4+vrq/r163ObEgAAAHCZsPwGr2eeeUZ//etfdfjwYatLAQAAAM68/LWylsuQ5XMg3nrrLe3atUt169ZVbGxsmacwffvttxZVBgAAAOC3LG8gevfubXUJAAAAwP+c6xnGcLK8gRg7tvImqQAAAAC4NJY3EGdt2LBB27dvlyS1atVK1157rcUVAQAAoDriPRCeWd5A5OXl6Z577lFGRobCwsIkSUePHlViYqI++eQT1alTx9oCAQAAADhZ3l4NHTpUx48f19atW3X48GEdPnxYW7ZsUX5+vh5//HGrywMAAEB1Y/OqvOUyZHkC8c0332jRokVq2bKlcywuLk5vv/22unfvbmFlAAAAAH7L8gbC4XDI19e3zLivr68cDocFFQEAAKBa8+IpTJ5Ynpt06dJFw4YN04EDB5xj+/fv14gRI9S1a1cLKwMAAADwW5YnEG+99ZbuuOMONWjQQDExMZKkffv2qXXr1vroo48srg4AAADVje0ynZtQWSxvIGJiYvTtt99q0aJF2rFjhySpZcuW6tatm8WVAQAAAPgty9qrJUuWKC4uTvn5+bLZbLrllls0dOhQDR06VO3bt1erVq20fPlyq8oDAABAdeVlq7zlMmRZAzF58mQ9/PDDCgkJKbMuNDRUjzzyiF5//XULKgMAAABQHssaiE2bNunWW28td3337t21YcOGSqwIAAAAwPlYNgciNzf3nI9vPcvHx0cHDx6sxIoAAAAAXbYveKssll2dq666Slu2bCl3/ffff6/o6OhKrAgAAADA+VjWQPTs2VPPPvusTp8+XWbdqVOnNHbsWN12220WVAYAAIBqzWarvOUyZNktTGPGjNEXX3yhZs2a6bHHHlPz5s0lSTt27NDbb7+t0tJSPfPMM1aVBwAAAOAcLGsgIiMjtWrVKg0ZMkSpqakyDEOSZLPZlJSUpLfffluRkZFWlQcAAIDqyos5EJ5Y+iK52NhYff311zpy5Ih27dolwzDUtGlT1axZ08qyAAAAAJTD8jdRS1LNmjXVvn17q8sAAAAAeArTeXB1AAAAAJhWJRIIAAAAoMrwujyfjlRZSCAAAAAAmEYDAQAAALiyeVXecpFeeukl2Ww2DR8+3Dl2+vRppaSkqFatWgoODlbfvn2Vm5vrtt/evXuVnJyswMBARURE6Mknn1RJSckFnZsGAgAAALiMrF+/Xu+9957atm3rNj5ixAjNnTtXn3/+uTIzM3XgwAH16dPHub60tFTJyckqKirSqlWrNGPGDE2fPl3PPffcBZ2fBgIAAABwVYXfRH3ixAn169dPf//7391efXDs2DG9//77ev3119WlSxe1a9dO06ZN06pVq7RmzRpJ0sKFC7Vt2zZ99NFHuuaaa9SjRw89//zzevvtt1VUVGS6BhoIAAAAwCKFhYXKz893WwoLC8vdPiUlRcnJyerWrZvb+IYNG1RcXOw23qJFC9WvX1+rV6+WJK1evVpt2rRxe1lzUlKS8vPztXXrVtM100AAAAAArry8Km1JS0tTaGio25KWlnbOsj755BN9++2351yfk5MjPz8/hYWFuY1HRkYqJyfHuY1r83B2/dl1ZvEYVwAAAMAiqampGjlypNuY3W4vs92+ffs0bNgwpaeny9/fv7LKOycSCAAAAMBVJc6BsNvtCgkJcVvO1UBs2LBBeXl5uu666+Tj4yMfHx9lZmbqb3/7m3x8fBQZGamioiIdPXrUbb/c3FxFRUVJkqKioso8lens57PbmEEDAQAAAFRxXbt21ebNm7Vx40bncv3116tfv37OP/v6+mrx4sXOfbKysrR3717Fx8dLkuLj47V582bl5eU5t0lPT1dISIji4uJM18ItTAAAAICrS3g/w++lRo0aat26tdtYUFCQatWq5RwfOHCgRo4cqfDwcIWEhGjo0KGKj49Xx44dJUndu3dXXFyc7r//fk2aNEk5OTkaM2aMUlJSzpl6lIcGAgAAALgCvPHGG/Ly8lLfvn1VWFiopKQkvfPOO8713t7emjdvnoYMGaL4+HgFBQVpwIABmjBhwgWdx2YYhlHRxVttz0O9rC4BACrUU6FvWl0CAFSoz15rYHUJ5Tr99dRKO5d/z0GVdq6KQgIBAAAAuPKqercwVSVcHQAAAACmkUAAAAAArmw2qyuo0kggAAAAAJhGAgEAAAC4qoKPca1KuDoAAAAATCOBAAAAAFwxB8IjEggAAAAAppFAAAAAAK54D4RHXB0AAAAAppFAAAAAAC4M5kB4RAIBAAAAwDQSCAAAAMAV74HwiKsDAAAAwDQSCAAAAMAVCYRHXB0AAAAAppFAAAAAAC54CpNnJBAAAAAATKOBAAAAAGAatzABAAAArphE7RFXBwAAAIBpJBAAAACAKyZRe0QCAQAAAMA0EggAAADAlRe/Y/eEqwMAAADANBIIAAAAwAUvkvOMBAIAAACAaSQQAAAAgCveA+ERVwcAAACAaSQQAAAAgAuDBMIjrg4AAAAA00ggAAAAAFc8hckjEggAAAAAppFAAAAAAC6YA+EZVwcAAACAaSQQAAAAgCvmQHhEAgEAAADANBIIAAAAwBVzIDzi6gAAAAAwjQYCAAAAgGncwgQAAAC4MJhE7REJBAAAAADTSCAAAAAAV0yi9oirAwAAAMA0EggAAADAhSHmQHhCAgEAAADANBIIAAAAwIXBHAiPuDoAAAAATCOBAAAAAFyRQHjE1QEAAABgGgkEAAAA4II3UXtGAgEAAADANBIIAAAAwAVPYfKMqwMAAADANBIIAAAAwBVzIDwigQAAAABgGgkEAAAA4II5EJ5xdQAAAACYRgMBAAAAwDRuYQIAAABcGGIStSckEAAAAABMI4EAAAAAXDCJ2jOuDgAAAADTSCAAAAAAV7xIziMSCAAAAACm0UAAAAAALgx5VdpyIaZMmaK2bdsqJCREISEhio+P1/z5853rExISZLPZ3JbBgwe7HWPv3r1KTk5WYGCgIiIi9OSTT6qkpOSC6uAWJgAAAOAyUK9ePb300ktq2rSpDMPQjBkz1KtXL3333Xdq1aqVJOnhhx/WhAkTnPsEBgY6/1xaWqrk5GRFRUVp1apVys7OVv/+/eXr66uJEyearoMGAgAAAHBhVNE5ELfffrvb5xdffFFTpkzRmjVrnA1EYGCgoqKizrn/woULtW3bNi1atEiRkZG65ppr9Pzzz2v06NEaN26c/Pz8TNXBLUwAAACARQoLC5Wfn++2FBYWnne/0tJSffLJJyooKFB8fLxz/OOPP1bt2rXVunVrpaam6uTJk851q1evVps2bRQZGekcS0pKUn5+vrZu3Wq6ZhoIAAAAwIVh86q0JS0tTaGhoW5LWlpaubVt3rxZwcHBstvtGjx4sObMmaO4uDhJ0n333aePPvpIS5cuVWpqqj788EP9+c9/du6bk5Pj1jxIcn7OyckxfX24hQkAAACwSGpqqkaOHOk2Zrfby92+efPm2rhxo44dO6ZZs2ZpwIAByszMVFxcnAYNGuTcrk2bNoqOjlbXrl21e/duNW7cuMJqpoEAAAAAXBiqvDkQdrvdY8PwW35+fmrSpIkkqV27dlq/fr3efPNNvffee2W27dChgyRp165daty4saKiorRu3Tq3bXJzcyWp3HkT58ItTAAAAMBlyuFwlDtnYuPGjZKk6OhoSVJ8fLw2b96svLw85zbp6ekKCQlx3gZlBgkEAAAA4MKwVc3fsaempqpHjx6qX7++jh8/rpkzZyojI0MLFizQ7t27NXPmTPXs2VO1atXS999/rxEjRqhTp05q27atJKl79+6Ki4vT/fffr0mTJiknJ0djxoxRSkrKBaUgNBAAAADAZSAvL0/9+/dXdna2QkND1bZtWy1YsEC33HKL9u3bp0WLFmny5MkqKChQTEyM+vbtqzFjxjj39/b21rx58zRkyBDFx8crKChIAwYMcHtvhBk0EAAAAICLqvoeiPfff7/cdTExMcrMzDzvMWJjY/X1119fUh1VM58BAAAAUCWRQAAAAAAuKvMpTJcjEggAAAAAptFAAAAAADCNW5gAAAAAF1X1Ma5VBVcHAAAAgGkkEAAAAIALJlF7RgIBAAAAwLSLaiCWLVumkpKSMuMlJSVatmzZJRcFAAAAWMWweVXacjm6qKoTExN1+PDhMuPHjh1TYmLiJRcFAAAAoGq6qDkQhmHIdo5XfB86dEhBQUGXXBQAAABgFeZAeHZBDUSfPn0kSTabTQ888IDsdrtzXWlpqb7//nvdeOONFVshAAAAgCrjghqI0NBQSWcSiBo1aiggIMC5zs/PTx07dtTDDz9csRUCAAAAlehynZtQWS6ogZg2bZokqUGDBnriiSe4XQkAAACoZi5qDsTYsWMlSQcPHlRWVpYkqXnz5qpTp07FVQYAAABYgDkQnl1UPnPy5En95S9/UXR0tDp16qROnTqpbt26GjhwoE6ePFnRNQIAAACoIi4qgRgxYoQyMzM1d+5c3XTTTZKkFStW6PHHH9eoUaM0ZcqUCi3yQv05d6Sl5weAipY6I8nqEgCgYr2WZXUF5TLO8bRR/M9FNRCzZ8/WrFmzlJCQ4Bzr2bOnAgICdNddd1neQAAAAAD4fVxUA3Hy5ElFRkaWGY+IiOAWJgAAAFzWDIMEwpOLmgMRHx+vsWPH6vTp086xU6dOafz48YqPj6+w4gAAAABULReVQEyePFm33nqr6tWrp6uvvlqStGnTJtntdi1cuLBCCwQAAAAqk3Fxv2OvNi6qgWjTpo127typjz/+WDt27JAk3XvvverXr5/by+UAAAAAXFkuqoFIS0tTZGRkmbdO//Of/9TBgwc1evToCikOAAAAQNVyUfnMe++9pxYtWpQZb9Wqld59991LLgoAAACwiiFbpS2Xo4tqIHJychQdHV1mvE6dOsrOzr7kogAAAABUTRfVQMTExGjlypVlxleuXKm6deteclEAAACAVUggPLuoORAPP/ywhg8fruLiYnXp0kWStHjxYj311FMaNWpUhRYIAAAAoOq4qAbiySef1KFDh/Too4+qqKhIkuTv76/Ro0crNTW1QgsEAAAAKtPlmgxUlotqIGw2m15++WU9++yz2r59uwICAtS0aVPZ7faKrg8AAABAFXJRDcRZwcHBat++fUXVAgAAAFiOBMIzXrMHAAAAwLRLSiAAAACAK41hkEB4QgIBAAAAwDQSCAAAAMAFcyA8I4EAAAAAYBoJBAAAAOCCBMIzEggAAAAAppFAAAAAAC5IIDwjgQAAAABgGgkEAAAA4IL3QHhGAgEAAADANBIIAAAAwIWDORAekUAAAAAAMI0GAgAAAIBp3MIEAAAAuOAxrp6RQAAAAAAwjQQCAAAAcMFjXD0jgQAAAABgGgkEAAAA4II5EJ6RQAAAAAAwjQQCAAAAcMEcCM9IIAAAAACYRgIBAAAAuGAOhGckEAAAAABMI4EAAAAAXDAHwjMSCAAAAACmkUAAAAAALhxWF1DFkUAAAAAAMI0EAgAAAHDBHAjPSCAAAAAAmEYCAQAAALjgPRCekUAAAAAAMI0GAgAAAIBp3MIEAAAAuGAStWckEAAAAABMI4EAAAAAXDCJ2jMSCAAAAOAyMGXKFLVt21YhISEKCQlRfHy85s+f71x/+vRppaSkqFatWgoODlbfvn2Vm5vrdoy9e/cqOTlZgYGBioiI0JNPPqmSkpILqoMGAgAAAHDhMCpvuRD16tXTSy+9pA0bNui///2vunTpol69emnr1q2SpBEjRmju3Ln6/PPPlZmZqQMHDqhPnz7O/UtLS5WcnKyioiKtWrVKM2bM0PTp0/Xcc89dUB02wzAusPSq7+bbM60uAQAqVOo3g6wuAQAqVHJxltUllGvZ1oJKO1enVkGXtH94eLheeeUV3XnnnapTp45mzpypO++8U5K0Y8cOtWzZUqtXr1bHjh01f/583XbbbTpw4IAiIyMlSe+++65Gjx6tgwcPys/Pz9Q5SSAAAAAAF4ZslbYUFhYqPz/fbSksLDxvjaWlpfrkk09UUFCg+Ph4bdiwQcXFxerWrZtzmxYtWqh+/fpavXq1JGn16tVq06aNs3mQpKSkJOXn5ztTDDNoIAAAAACLpKWlKTQ01G1JS0srd/vNmzcrODhYdrtdgwcP1pw5cxQXF6ecnBz5+fkpLCzMbfvIyEjl5ORIknJyctyah7Prz64zi6cwAQAAAC4q8z0QqampGjlypNuY3W4vd/vmzZtr48aNOnbsmGbNmqUBAwYoM7Nyb9+ngQAAAAAsYrfbPTYMv+Xn56cmTZpIktq1a6f169frzTff1N13362ioiIdPXrULYXIzc1VVFSUJCkqKkrr1q1zO97ZpzSd3cYMbmECAAAAXBhG5S2XyuFwqLCwUO3atZOvr68WL17sXJeVlaW9e/cqPj5ekhQfH6/NmzcrLy/PuU16erpCQkIUFxdn+pwkEAAAAMBlIDU1VT169FD9+vV1/PhxzZw5UxkZGVqwYIFCQ0M1cOBAjRw5UuHh4QoJCdHQoUMVHx+vjh07SpK6d++uuLg43X///Zo0aZJycnI0ZswYpaSkXFAKQgMBAAAAuHBU0TdR5+XlqX///srOzlZoaKjatm2rBQsW6JZbbpEkvfHGG/Ly8lLfvn1VWFiopKQkvfPOO879vb29NW/ePA0ZMkTx8fEKCgrSgAEDNGHChAuqg/dAAMBlgPdAALjSVOX3QCzefLrSztW1jX+lnauikEAAAAAALirzKUyXIyZRAwAAADCNBAIAAABwceXd4F+xSCAAAAAAmEYCAQAAALgwquhTmKoKEggAAAAAptFAAAAAADCNW5gAAAAAFw4mUXtEAgEAAADANBIIAAAAwAUvkvOMBAIAAACAaSQQAAAAgAteJOcZCQQAAAAA00ggAAAAABcOXiTnEQkEAAAAANNIIAAAAAAXzIHwjAQCAAAAgGkkEAAAAIAL3gPhGQkEAAAAANNIIAAAAAAXDuZAeEQCAQAAAMA0EggAAADABU9h8owEAgAAAIBpJBAAAACAC4M3UXtEAgEAAADANBoIAAAAAKZxCxMAAADggse4ekYCAQAAAMA0EggAAADABY9x9YwEAgAAAIBpJBAAAACACxIIz0ggAAAAAJhGAgEAAAC4cBi8SM4TEggAAAAAppFAAAAAAC6YA+EZCQQAAAAA00ggAAAAABckEJ6RQAAAAAAwjQQCAAAAcOEggfCIBAIAAACAaSQQAAAAgAuD90B4RAIBAAAAwDQSCAAAAMAFT2HyjAQCAAAAgGkkEAAAAIALnsLkGQkEAAAAANNoIAAAAACYxi1MAAAAgAsmUXtGAgEAAADANBIIAAAAwAUJhGckEAAAAABMI4EAAAAAXPAYV89IIAAAAACYRgIBAAAAuGAOhGckEAAAAABMszyB+Nvf/nbOcZvNJn9/fzVp0kSdOnWSt7d3JVcGAACA6sjhsLqCqs3yBuKNN97QwYMHdfLkSdWsWVOSdOTIEQUGBio4OFh5eXlq1KiRli5dqpiYGIurBQAAAKo3y29hmjhxotq3b6+dO3fq0KFDOnTokH744Qd16NBBb775pvbu3auoqCiNGDHC6lIBAABQDRhG5S2XI8sTiDFjxmj27Nlq3Lixc6xJkyZ69dVX1bdvX/3444+aNGmS+vbta2GVAAAAAKQq0EBkZ2erpKSkzHhJSYlycnIkSXXr1tXx48cruzQAAABUQ5drMlBZLL+FKTExUY888oi+++4759h3332nIUOGqEuXLpKkzZs3q2HDhlaVCAAAAOD/s7yBeP/99xUeHq527drJbrfLbrfr+uuvV3h4uN5//31JUnBwsF577TWLKwUAAEB14DAqb7kcWX4LU1RUlNLT07Vjxw798MMPkqTmzZurefPmzm0SExOtKg8AAACAC8sbiLNatGihFi1aWF0GAAAAqjmjUidB2CrxXBXD8gaitLRU06dP1+LFi5WXlyfHb97csWTJEosqAwAAAPBbls+BGDZsmIYNG6bS0lK1bt1aV199tdsCAAAAQEpLS1P79u1Vo0YNRUREqHfv3srKynLbJiEhQTabzW0ZPHiw2zZ79+5VcnKyAgMDFRERoSeffPKcT0Utj+UJxCeffKLPPvtMPXv2tLoUAAAAoMo+xjUzM1MpKSlq3769SkpK9Ne//lXdu3fXtm3bFBQU5Nzu4Ycf1oQJE5yfAwMDnX8uLS1VcnKyoqKitGrVKmVnZ6t///7y9fXVxIkTTdVheQPh5+enJk2aWF0GAAAAUKV98803bp+nT5+uiIgIbdiwQZ06dXKOBwYGKioq6pzHWLhwobZt26ZFixYpMjJS11xzjZ5//nmNHj1a48aNk5+f33nrsPwWplGjRunNN9+s5MkqAAAAwLk5HJW3FBYWKj8/320pLCw0VeexY8ckSeHh4W7jH3/8sWrXrq3WrVsrNTVVJ0+edK5bvXq12rRpo8jISOdYUlKS8vPztXXrVlPntTyBWLFihZYuXar58+erVatW8vX1dVv/xRdfWFQZqqurW4Xqvj4xat44WLVr2ZX64hYtX3PIuf6vw5urZ1f3rn7thsMaNW6z83NM3QA9+mAjtYkLla+PTbv3FOjvH+3Rd5uPVtbXAABJUtNnH1Oz54a6jZ3Y8aMy2/SQJMU8dJeuuuc2hVzbSr4hwVpQ+3qVHDvu3DYg9io1feZR1UroKHtUbZ0+kKf9M/+jXWnvyigurtTvAlyJ0tLSNH78eLexsWPHaty4cR73czgcGj58uG666Sa1bt3aOX7fffcpNjZWdevW1ffff6/Ro0crKyvL+TN1Tk6OW/Mgyfk5JyfHVM2WNxBhYWH64x//aHUZgFOAv7d2/XRCX6Vna+Izrc+5zZoNhzVx8g7n5+Ji9wRt0nOtte/AKQ17ZpMKCx26q9dVmvRca9398FodPsp/cAFUruNbftDaWx90fnaUlDr/7B0YoIMLluvgguVqMfGJMvsGN28kedm0+dHnVLD7Z9Vo1Uxt331ePkEB2j56UqXUD1S2yrwxJjU1VSNHjnQbs9vt590vJSVFW7Zs0YoVK9zGBw0a5PxzmzZtFB0dra5du2r37t1q3LhxhdRseQMxbdo0q0sA3KzZcFhrNhz2uE1RsaPcRiA0xEcxVwUq7W8/aPeeAknSlBk/qU/yVWoUG6TDR49WdMkA4JGjtFSFub+ec92ev82QJIV3uuGc6w8uXK6DC5c7P5/66Rf9+HpDxT5yLw0EUAHsdruphsHVY489pnnz5mnZsmWqV6+ex207dOggSdq1a5caN26sqKgorVu3zm2b3NxcSSp33sRvWT4H4qyDBw9qxYoVWrFihQ4ePGh1OYBH17YO09wP4zVzSnuNGtJUITX+14sfyy/Rz7+c1K1dIuVv95K3l9T71mgdPlKkrF0nLKwaQHUV1CRWXX9ersSsRbrmg1flHxN9ScfzCa2hoiPHKqg6oOpxGJW3XAjDMPTYY49pzpw5WrJkiRo2bHjefTZu3ChJio4+8//7+Ph4bd68WXl5ec5t0tPTFRISori4OFN1WJ5AFBQUaOjQofrggw+cL5Hz9vZW//799X//939uj506l8LCwjITTRylRfLyPv8McuBirN1wWJmrflV27mldFe2vQfc31Kvj2mjwk9/p7HsQh4/ZpLRnWmvhZzfLYUhHjxZp1LjNOl5g/hnLAFARjq77XpsGpqrgh59kj6qjZs+mKH7px1p2ze0qPVFwwccLbFxfDVL+rO2jX/4dqgXgSUpKimbOnKkvv/xSNWrUcM5ZCA0NVUBAgHbv3q2ZM2eqZ8+eqlWrlr7//nuNGDFCnTp1Utu2bSVJ3bt3V1xcnO6//35NmjRJOTk5GjNmjFJSUkwnIZYnECNHjlRmZqbmzp2ro0eP6ujRo/ryyy+VmZmpUaNGnXf/tLQ0hYaGui2/7Pq4EipHdbV4+UGtXHdIP/5coOVrDmn0hC2Kaxaia1uHObcZObipjhwrUsrTGzVo1LdavvZXvfxsa9WqSWMLoHIdXLBMObO/0fHNWfo1fYXW3T5IvmEhqvunHhd8LHvdCN0w7x/Knv2N9r3/+e9QLVA1GEblLRdiypQpOnbsmBISEhQdHe1cPv30U0lnXo+waNEide/eXS1atNCoUaPUt29fzZ0713kMb29vzZs3T97e3oqPj9ef//xn9e/f3+29EedjeQIxe/ZszZo1SwkJCc6xnj17KiAgQHfddZemTJnicf9zTTy59Z61v0epwDkdyD2tI8eKVK9ugDZ8f1Tt2obpxva11OPelTp56sxExdem7NL119RUj66R+mjWPosrBlCdlRw7roKdexTYuP4F7WePjlDH9A90ZM132jz42d+pOgCenO+1BzExMcrMzDzvcWJjY/X1119fdB2WNxAnT54s8ygpSYqIiHB7Zm15zjXxhNuXUJnq1PJTaA1f/Xq4SJLkb/eWVPb/5IZDstlslV4fALjyDgpUYKMYFX5sfr6hve6Z5uHYt1u1aWBq1X1NL1BBjAudnHBJLr+fDSxvIOLj4zV27Fh98MEH8vf3lySdOnVK48ePV3x8vMXVoToK8PfSVdEBzs/Rkf5q0jBIx0+UKP94sR68t4EyVx3UoSNFuirqzPse9mef0rpvzzy5aUvWMR0vKNEzI1po+r9+VmGRQ7cnRSs60l+r1x8q77QA8Lto+fJTyp23VKf2HpB/3Qg1fW6ojFKHDnwyT5Jkj6wte1RtBTU5k0jUaN1MpScKdGpvtoqPHJO9boTiF32oU3sPaPvol2Wv878XVpX3ZCcAVzbLG4jJkyfr1ltvVb169XT11VdLkjZt2iR/f38tWLDA4upQHbVoUkP/l3aN8/PjDzWRJH29OEevvrNTjRsEqUeXSAUH+ejXw0Va/91h/f3jPSouOfPbimP5JRo19nsNur+h3nzxavn42PTT3pNKfXGrdu258AmLAHAp/K+K0rUfvS7fWmEqOnhYR1Zu0Kqb71LRr0ckSfUH3eP2orkbM2ZKkjYNfFq/fDBHdbrdpKCmDRTUtIG6/bzc7dhf+TavvC8CVKJKDSAuQzbjfDdTVYKTJ0/q448/1o4dZ17M1bJlS/Xr108BAQHn2fPcbr79/Pd+AcDlJPWbQeffCAAuI8nFWVaXUK5Jsx2Vdq6n+lr+TKMLZmkCUVxcrBYtWmjevHl6+OGHrSwFAAAAkMQ0n/OxtOXx9fXV6dOnrSwBAAAAwAWwPDNJSUnRyy+/rJISXrAFAAAA6zkcRqUtlyPLJ1GvX79eixcv1sKFC9WmTRsFBQW5rf/iiy8sqgwAAADAb1nWQPz0009q2LChwsLC1LdvX6vKAAAAANwwB8IzyxqIxo0bKzY2VomJic6lXr16VpUDAAAAwATLGoglS5YoIyNDGRkZ+te//qWioiI1atRIXbp0UZcuXZSQkHDON1QDAAAAsI5lDURCQoISEhIkSadPn9aqVaucDcWMGTOcj3jdunWrVSUCAACgGuIWJs8sn0QtSf7+/urSpYtuvvlmJSYmav78+XrvvfecL5YDAAAAUDVY2kAUFRVpzZo1Wrp0qTIyMrR27VrFxMSoU6dOeuutt9S5c2crywMAAEA15CCC8MiyBqJLly5au3atGjZsqM6dO+uRRx7RzJkzFR0dbVVJAAAAAM7DsgZi+fLlio6Odk6Y7ty5s2rVqmVVOQAAAIAkyXBYXUHVZtmbqI8ePaqpU6cqMDBQL7/8surWras2bdroscce06xZs3Tw4EGrSgMAAABQDssSiKCgIN1666269dZbJUnHjx/XihUrtHTpUk2aNEn9+vVT06ZNtWXLFqtKBAAAQDVkMAfCI8sSiN8KCgpSeHi4wsPDVbNmTfn4+Gj79u1WlwUAAADAhWUJhMPh0H//+19lZGRo6dKlWrlypQoKCnTVVVcpMTFRb7/9thITE60qDwAAANWUgzkQHlnWQISFhamgoEBRUVFKTEzUG2+8oYSEBDVu3NiqkgAAAACch2UNxCuvvKLExEQ1a9bMqhIAAACAMpgD4ZllDcQjjzxi1akBAAAAXCRL30QNAAAAVDUOAgiPqsxTmAAAAABUfSQQAAAAgAuDCMIjEggAAAAAppFAAAAAAC54CJNnJBAAAAAATKOBAAAAAGAatzABAAAALhxMovaIBAIAAACAaSQQAAAAgAuDWdQekUAAAAAAMI0EAgAAAHBhOKyuoGojgQAAAABgGgkEAAAA4MLBHAiPSCAAAAAAmEYCAQAAALjgKUyekUAAAAAAMI0EAgAAAHDBm6g9I4EAAAAAYBoJBAAAAOCCKRCekUAAAAAAMI0EAgAAAHBhMAfCIxIIAAAAAKaRQAAAAAAueBO1ZyQQAAAAAEyjgQAAAABgGrcwAQAAAC6YRO0ZCQQAAAAA00ggAAAAABckEJ6RQAAAAAAwjQQCAAAAcEEA4RkJBAAAAADTSCAAAAAAF8yB8IwEAgAAAIBpJBAAAACAC8MggfCEBAIAAACAaSQQAAAAgAsHcyA8IoEAAAAAYBoJBAAAAOCCORCekUAAAAAAMI0EAgAAAHDBeyA8I4EAAAAAYBoNBAAAAODCcBiVtlyItLQ0tW/fXjVq1FBERIR69+6trKwst21Onz6tlJQU1apVS8HBwerbt69yc3Pdttm7d6+Sk5MVGBioiIgIPfnkkyopKTFdBw0EAAAAcBnIzMxUSkqK1qxZo/T0dBUXF6t79+4qKChwbjNixAjNnTtXn3/+uTIzM3XgwAH16dPHub60tFTJyckqKirSqlWrNGPGDE2fPl3PPfec6TpsxhU4zfzm2zOtLgEAKlTqN4OsLgEAKlRycdb5N7LIA+Nyz79RBZk+LvKi9z148KAiIiKUmZmpTp066dixY6pTp45mzpypO++8U5K0Y8cOtWzZUqtXr1bHjh01f/583XbbbTpw4IAiI8+c+91339Xo0aN18OBB+fn5nfe8JBAAAACARQoLC5Wfn++2FBYWmtr32LFjkqTw8HBJ0oYNG1RcXKxu3bo5t2nRooXq16+v1atXS5JWr16tNm3aOJsHSUpKSlJ+fr62bt1q6rw0EAAAAIBF0tLSFBoa6rakpaWddz+Hw6Hhw4frpptuUuvWrSVJOTk58vPzU1hYmNu2kZGRysnJcW7j2jycXX92nRk8xhUAAABwUZmPcU19JlUjR450G7Pb7efdLyUlRVu2bNGKFSt+r9LKRQMBAAAAWMRut5tqGFw99thjmjdvnpYtW6Z69eo5x6OiolRUVKSjR4+6pRC5ubmKiopybrNu3Tq34519StPZbc6HW5gAAAAAF4ZhVNpyoXU99thjmjNnjpYsWaKGDRu6rW/Xrp18fX21ePFi51hWVpb27t2r+Ph4SVJ8fLw2b96svLw85zbp6ekKCQlRXFycqTpIIAAAAIDLQEpKimbOnKkvv/xSNWrUcM5ZCA0NVUBAgEJDQzVw4ECNHDlS4eHhCgkJ0dChQxUfH6+OHTtKkrp37664uDjdf//9mjRpknJycjRmzBilpKSYTkJoIAAAAAAXjkqcA3EhpkyZIklKSEhwG582bZoeeOABSdIbb7whLy8v9e3bV4WFhUpKStI777zj3Nbb21vz5s3TkCFDFB8fr6CgIA0YMEATJkwwXQcNBAAAAHAZMHPLk7+/v95++229/fbb5W4TGxurr7/++qLroIEAAAAAXFTmU5guR0yiBgAAAGAaCQQAAADg4kKfjlTdkEAAAAAAMI0EAgAAAHBhOBxWl1ClkUAAAAAAMI0EAgAAAHBRVd8DUVWQQAAAAAAwjQQCAAAAcMFTmDwjgQAAAABgGgkEAAAA4II3UXtGAgEAAADANBoIAAAAAKZxCxMAAADggluYPCOBAAAAAGAaCQQAAADgwmE4rC6hSiOBAAAAAGAaCQQAAADggjkQnpFAAAAAADCNBAIAAABwQQLhGQkEAAAAANNIIAAAAAAXhkEC4QkJBAAAAADTSCAAAAAAFw4H74HwhAQCAAAAgGkkEAAAAIALnsLkGQkEAAAAANNIIAAAAAAXhsEcCE9IIAAAAACYRgIBAAAAuGAOhGckEAAAAABMI4EAAAAAXJBAeEYCAQAAAMA0GggAAAAApnELEwAAAODCwWNcPSKBAAAAAGAaCQQAAADggknUnpFAAAAAADCNBAIAAABwYTiYA+EJCQQAAAAA00ggAAAAABfMgfCMBAIAAACAaSQQAAAAgAuD90B4RAIBAAAAwDQSCAAAAMCFgzkQHpFAAAAAADCNBAIAAABwwXsgPCOBAAAAAGAaCQQAAADggvdAeEYCAQAAAMA0EggAAADABe+B8IwEAgAAAIBpNBAAAAAATOMWJgAAAMAFk6g9I4EAAAAAYBoJBAAAAOCCF8l5RgIBAAAAwDSbYRjc5AVchMLCQqWlpSk1NVV2u93qcgDgkvHvGgAzaCCAi5Sfn6/Q0FAdO3ZMISEhVpcDAJeMf9cAmMEtTAAAAABMo4EAAAAAYBoNBAAAAADTaCCAi2S32zV27FgmGgK4YvDvGgAzmEQNAAAAwDQSCAAAAACm0UAAAAAAMI0GAgAAAIBpNBAAAAAATKOBQLWQk5OjoUOHqlGjRrLb7YqJidHtt9+uxYsXW11aGdOnT1dYWJjVZQCo4t59913VqFFDJSUlzrETJ07I19dXCQkJbttmZGTIZrNp9+7dlVwlgCsRDQSueHv27FG7du20ZMkSvfLKK9q8ebO++eYbJSYmKiUl5aKOWVRUdM7x4uLiSykVAExLTEzUiRMn9N///tc5tnz5ckVFRWnt2rU6ffq0c3zp0qWqX7++Gjdu7HaM8v4tAwBPaCBwxXv00Udls9m0bt069e3bV82aNVOrVq00cuRIrVmzRpK0d+9e9erVS8HBwQoJCdFdd92l3Nxc5zHGjRuna665Rv/4xz/UsGFD+fv7S5JsNpumTJmiO+64Q0FBQXrxxRclSV9++aWuu+46+fv7q1GjRho/frzbbwmPHj2qRx55RJGRkfL391fr1q01b948ZWRk6MEHH9SxY8dks9lks9k0bty4yrtYAC4bzZs3V3R0tDIyMpxjGRkZ6tWrlxo2bOj89+3seGJioh544AH17t1bL774ourWravmzZtLkjZv3qwuXbooICBAtWrV0qBBg3TixAnn/mf3e/XVVxUdHa1atWopJSXF7Zcm2dnZSk5OVkBAgBo2bKiZM2eqQYMGmjx58u9+LQBULhoIXNEOHz6sb775RikpKQoKCiqzPiwsTA6HQ7169dLhw4eVmZmp9PR0/fjjj7r77rvdtt21a5dmz56tL774Qhs3bnSOjxs3Tn/84x+1efNm/eUvf9Hy5cvVv39/DRs2TNu2bdN7772n6dOnO5sLh8OhHj16aOXKlfroo4+0bds2vfTSS/L29taNN96oyZMnKyQkRNnZ2crOztYTTzzxu14jAJevxMRELV261Pl56dKlSkhIUOfOnZ3jp06d0tq1a5WYmChJWrx4sbKyspSenq558+apoKBASUlJqlmzptavX6/PP/9cixYt0mOPPeZ2rqVLl2r37t1aunSpZsyYoenTp2v69OnO9f3799eBAweUkZGh2bNna+rUqcrLy/v9LwKAymcAV7C1a9cakowvvvii3G0WLlxoeHt7G3v37nWObd261ZBkrFu3zjAMwxg7dqzh6+tr5OXlue0ryRg+fLjbWNeuXY2JEye6jX344YdGdHS0YRiGsWDBAsPLy8vIyso6Zz3Tpk0zQkNDTX9HANXX3//+dyMoKMgoLi428vPzDR8fHyMvL8+YOXOm0alTJ8MwDGPx4sWGJOPnn382BgwYYERGRhqFhYXOY0ydOtWoWbOmceLECefYV199ZXh5eRk5OTmGYRjGgAEDjNjYWKOkpMS5zZ/+9Cfj7rvvNgzDMLZv325IMtavX+9cv3PnTkOS8cYbb/yelwCABUggcEUzTLxoffv27YqJiVFMTIxzLC4uTmFhYdq+fbtzLDY2VnXq1Cmz//XXX+/2edOmTZowYYKCg4Ody8MPP6zs7GydPHlSGzduVL169dSsWbNL+GYAICUkJKigoEDr16/X8uXL1axZM9WpU0edO3d2zoPIyMhQo0aNVL9+fUlSmzZt5Ofn5zzG9u3bdfXVV7ultDfddJMcDoeysrKcY61atZK3t7fzc3R0tDNhyMrKko+Pj6677jrn+iZNmqhmzZq/23cHYB0fqwsAfk9NmzaVzWbTjh07LvlY57oF6lzjJ06c0Pjx49WnT58y2/r7+ysgIOCSawEA6cwP6fXq1dPSpUt15MgRde7cWZJUt25dxcTEaNWqVVq6dKm6dOni3Ke8f8vOx9fX1+2zzWaTw+G4+OIBXLZIIHBFCw8PV1JSkt5++20VFBSUWX/06FG1bNlS+/bt0759+5zj27Zt09GjRxUXF3fB57zuuuuUlZWlJk2alFm8vLzUtm1b/fLLL/rhhx/Oub+fn59KS0sv+LwAqqfExERlZGQoIyPD7fGtnTp10vz587Vu3Trn/IdzadmypTZt2uT2b+TKlSvl5eXlnGR9Ps2bN1dJSYm+++4759iuXbt05MiRC/9CAKo8Gghc8d5++22Vlpbqhhtu0OzZs7Vz505t375df/vb3xQfH69u3bqpTZs26tevn7799lutW7dO/fv3V+fOncvcnmTGc889pw8++EDjx4/X1q1btX37dn3yyScaM2aMJKlz587q1KmT+vbtq/T0dP3000+aP3++vvnmG0lSgwYNdOLECS1evFi//vqrTp48WaHXA8CVJTExUStWrNDGjRudCYR05t+a9957T0VFRR4biH79+snf318DBgzQli1btHTpUg0dOlT333+/IiMjTdXQokULdevWTYMGDdK6dev03XffadCgQQoICJDNZrvk7wigaqGBwBWvUaNG+vbbb5WYmKhRo0apdevWuuWWW7R48WJNmTJFNptNX375pWrWrKlOnTqpW7duatSokT799NOLOl9SUpLmzZunhQsXqn379urYsaPeeOMNxcbGOreZPXu22rdvr3vvvVdxcXF66qmnnKnDjTfeqMGDB+vuu+9WnTp1NGnSpAq5DgCuTImJiTp16pSaNGni9gN/586ddfz4cefjXssTGBioBQsW6PDhw2rfvr3uvPNOde3aVW+99dYF1fHBBx8oMjJSnTp10h//+Ec9/PDDqlGjhvOx1wCuHDbDzCxTAACAC/DLL78oJiZGixYtUteuXa0uB0AFooEAAACXbMmSJTpx4oTatGmj7OxsPfXUU9q/f79++OGHMhOwAVzeeAoTAAC4ZMXFxfrrX/+qH3/8UTVq1NCNN96ojz/+mOYBuAKRQAAAAAAwjUnUAAAAAEyjgQAAAABgGg0EAAAAANNoIAAAAACYRgMBAAAAwDQaCACoRDabTf/+978v+3MAAKovGggAAAAAptFAAAAAADCNBgIAKlBCQoIef/xxPfXUUwoPD1dUVJTGjRtX7va//PKL7r33XoWHhysoKEjXX3+91q5d61w/ZcoUNW7cWH5+fmrevLk+/PBDt/137typTp06yd/fX3FxcUpPTy9zjn379umuu+5SWFiYwsPD1atXL+3Zs6eivjIAoJqhgQCACjZjxgwFBQVp7dq1mjRpkiZMmHDOH+xPnDihzp07a//+/frPf/6jTZs26amnnpLD4ZAkzZkzR8OGDdOoUaO0ZcsWPfLII3rwwQe1dOlSSZLD4VCfPn3k5+entWvX6t1339Xo0aPdzlFcXKykpCTVqFFDy5cv18qVKxUcHKxbb71VRUVFv//FAABccWyGYRhWFwEAV4qEhASVlpZq+fLlzrEbbrhBXbp00UsvvSSbzaY5c+aod+/emjp1qp544gnt2bNH4eHhZY510003qVWrVpo6dapz7K677lJBQYG++uorLVy4UMnJyfr5559Vt25dSdI333yjHj16OM/x0Ucf6YUXXtD27dtls9kkSUVFRQoLC9O///1vde/e/Xe+IgCAKw0JBABUsLZt27p9jo6OVl5eXpntNm7cqGuvvfaczYMkbd++XTfddJPb2E033aTt27c718fExDibB0mKj493237Tpk3atWuXatSooeDgYAUHBys8PFynT5/W7t27L+r7AQCqNx+rCwCAK42vr6/bZ5vN5rwtyVVAQMDvXsuJEyfUrl07ffzxx2XW1alT53c/PwDgykMCAQAWadu2rTZu3KjDhw+fc33Lli21cuVKt7GVK1cqLi7OuX7fvn3Kzs52rl+zZo3b9tddd5127typiIgINWnSxG0JDQ2t4G8EAKgOaCAAwCL33nuvoqKi1Lt3b61cuVI//vijZs+erdWrV0uSnnzySU2fPl1TpkzRzp079frrr+uLL77QE088IUnq1q2bmjVrpgEDBmjTpk1avny5nnnmGbdz9OvXT7Vr11avXr20fPly/fTTT8rIyNDjjz+uX375pdK/MwDg8kcDAQAW8fPz08KFCxUREaGePXuqTZs2eumll+Tt7S1J6t27t9588029+uqratWqld577z1NmzZNCQkJkiQvLy/NmTNHp06d0g033KCHHnpIL774ots5AgMDtWzZMtWvX199+vRRy5YtNXDgQJ0+fVohISGV/ZUBAFcAnsIEAAAAwDQSCAAAAACm0UAAAAAAMI0GAgAAAIBpNBAAAAAATKOBAAAAAGAaDQQAAAAA02ggAAAAAJhGAwEAAADANBoIAAAAAKbRQAAAAAAwjQYCAAAAgGn/D2EuWu1Y2vf7AAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 1000x700 with 2 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "from reasoner import retrieve_answer_math\n",
    "\n",
    "model_name = 'gpt-4o-mini'\n",
    "# model_name = 'meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo'\n",
    "dataset_list = ['algebra', 'counting & probability', 'geometry', 'number theory', 'intermediate algebra','precalculus', 'prealgebra']\n",
    "\n",
    "method_1 = 'cot'\n",
    "method_2 = 'nlcode'\n",
    "\n",
    "all_answers = retrieve_answer_math(model_name)\n",
    "records = {\n",
    "    f'{method_1}_correct_{method_2}_correct': 0,\n",
    "    f'{method_1}_correct_{method_2}_wrong': 0,\n",
    "    f'{method_1}_wrong_{method_2}_correct': 0,\n",
    "    f'{method_1}_wrong_{method_2}_wrong': 0\n",
    "}\n",
    "\n",
    "answers_1 = all_answers[method_1]\n",
    "answers_2 = all_answers[method_2]\n",
    "\n",
    "for dataset in dataset_list:\n",
    "    keys = list(answers_1[dataset].keys())\n",
    "    for i in keys:\n",
    "        # print(f'{answers_1[dataset]}')\n",
    "        if answers_1[dataset][i]['correct'] == answers_2[dataset][i]['correct']:\n",
    "            if answers_1[dataset][i]['correct']:\n",
    "                records[f'{method_1}_correct_{method_2}_correct'] += 1\n",
    "            else:\n",
    "                records[f'{method_1}_wrong_{method_2}_wrong'] += 1\n",
    "        else:\n",
    "            if answers_1[dataset][i]['correct']:\n",
    "                records[f'{method_1}_correct_{method_2}_wrong'] += 1\n",
    "            else:\n",
    "                records[f'{method_1}_wrong_{method_2}_correct'] += 1\n",
    "    \n",
    "for key, value in records.items():\n",
    "    print(f'{key}: {value}')\n",
    "\n",
    "# plot a metrix\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "\n",
    "data = np.array([[records[f'{method_1}_correct_{method_2}_correct'], records[f'{method_1}_correct_{method_2}_wrong']],\n",
    "                 [records[f'{method_1}_wrong_{method_2}_correct'], records[f'{method_1}_wrong_{method_2}_wrong']]])\n",
    "df_cm = pd.DataFrame(data, columns=['Correct', 'Wrong'], index=['Correct', 'Wrong'])\n",
    "plt.figure(figsize=(10,7))\n",
    "sns.heatmap(df_cm, annot=True, fmt='d', cmap='coolwarm')\n",
    "plt.xlabel(f'{method_2}')\n",
    "plt.ylabel(f'{method_1}')\n",
    "plt.title(f'{method_1} vs {method_2}, {model_name}')\n",
    "\n",
    "plt.savefig(f'analysis/{model_name}_{method_1}_vs_{method_2}.png')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## COT vs CodeNL"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## LLama3.1 8B"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import numpy as np\n",
    "\n",
    "# file_name = 'analysis/gpt-4o-mini_cot_wrong.json'\n",
    "file_name = 'analysis/Meta-Llama-3.1-8B-Instruct-Turbo_cot_wrong.json'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "25\n",
      "cot_wrong\n"
     ]
    }
   ],
   "source": [
    "start_idx = 0\n",
    "data = json.load(open(file_name))\n",
    "print(len(data))\n",
    "print(data[0]['type'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 0\n",
      "subset: precalculus\n",
      "idx: 463\n",
      "question: A line passing through the point $(1,1,1)$ intersects the line defined by\n",
      "\\[\\begin{pmatrix} 1 \\\\ 2 \\\\ 3 \\end{pmatrix} + t \\begin{pmatrix} 2 \\\\ 3 \\\\ 4 \\end{pmatrix}\\]at $P,$ and intersects the line defined by\n",
      "\\[\\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]at $Q.$  Find point $Q.$\n",
      "ground_truth: (7,21,35)\n",
      "------------COT-------------\n",
      "i: 0\n",
      "cot_answer: 2\n",
      "cot_rp: To find point Q, we can follow these steps:\n",
      "\n",
      "Let's denote the line passing through the point (1,1,1) as l. The direction vector of l is not given, but we can find it using the point (1,1,1) and another point P on the line.\n",
      "\n",
      "Since P lies on the line defined by the vector (2,3,4), we can write the equation of the line l as:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} a \\\\ b \\\\ c \\end{pmatrix}\\]\n",
      "\n",
      "where (a,b,c) is the direction vector of the line l.\n",
      "\n",
      "Since P lies on the line defined by the vector (2,3,4), we can write:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} a \\\\ b \\\\ c \\end{pmatrix} = \\begin{pmatrix} 1 \\\\ 2 \\\\ 3 \\end{pmatrix} + t \\begin{pmatrix} 2 \\\\ 3 \\\\ 4 \\end{pmatrix}\\]\n",
      "\n",
      "Equating the x, y, and z components, we get:\n",
      "\n",
      "\\[1 + ka = 1 + 2t\\]\n",
      "\\[1 + kb = 2 + 3t\\]\n",
      "\\[1 + kc = 3 + 4t\\]\n",
      "\n",
      "Solving for a, b, and c, we get:\n",
      "\n",
      "\\[a = 2 + 2t\\]\n",
      "\\[b = 3 + 3t\\]\n",
      "\\[c = 4 + 4t\\]\n",
      "\n",
      "Substituting these values of a, b, and c into the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 2 + 2t \\\\ 3 + 3t \\\\ 4 + 4t \\end{pmatrix}\\]\n",
      "\n",
      "Now, let's find the intersection point Q of the line l and the line defined by the vector (-2,3,-1).\n",
      "\n",
      "The direction vector of this line is (1,2,4). We can write the equation of this line as:\n",
      "\n",
      "\\[\\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]\n",
      "\n",
      "Equating this with the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 2 + 2t \\\\ 3 + 3t \\\\ 4 + 4t \\end{pmatrix} = \\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]\n",
      "\n",
      "Equating the x, y, and z components, we get:\n",
      "\n",
      "\\[1 + k(2 + 2t) = -2 + s\\]\n",
      "\\[1 + k(3 + 3t) = 3 + 2s\\]\n",
      "\\[1 + k(4 + 4t) = -1 + 4s\\]\n",
      "\n",
      "Solving for s, we get:\n",
      "\n",
      "\\[s = \\frac{3 + k(2 + 2t)}{3}\\]\n",
      "\\[s = \\frac{2 + k(3 + 3t)}{2}\\]\n",
      "\\[s = \\frac{2 + k(4 + 4t)}{4}\\]\n",
      "\n",
      "Equating the values of s from the first two equations, we get:\n",
      "\n",
      "\\[\\frac{3 + k(2 + 2t)}{3} = \\frac{2 + k(3 + 3t)}{2}\\]\n",
      "\n",
      "Solving for k, we get:\n",
      "\n",
      "\\[6 + 6k + 6kt = 6 + 3k + 9kt\\]\n",
      "\n",
      "\\[3k - 3kt = 0\\]\n",
      "\n",
      "\\[k(3 - 3t) = 0\\]\n",
      "\n",
      "\\[k = 0 \\text{ or } t = 1\\]\n",
      "\n",
      "If k = 0, then the point P is (1,1,1). This is not possible, since P is the intersection point of the two lines.\n",
      "\n",
      "So, t = 1.\n",
      "\n",
      "Substituting t = 1 into the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix}\\]\n",
      "\n",
      "Equating this with the equation of the line defined by the vector (-2,3,-1), we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix} = \\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]\n",
      "\n",
      "Equating the x, y, and z components, we get:\n",
      "\n",
      "\\[1 + 4k = -2 + s\\]\n",
      "\\[1 + 6k = 3 + 2s\\]\n",
      "\\[1 + 8k = -1 + 4s\\]\n",
      "\n",
      "Solving for s, we get:\n",
      "\n",
      "\\[s = \\frac{3 + 4k}{3}\\]\n",
      "\\[s = \\frac{2 + 3k}{2}\\]\n",
      "\\[s = \\frac{2 + 2k}{4}\\]\n",
      "\n",
      "Equating the values of s from the first two equations, we get:\n",
      "\n",
      "\\[\\frac{3 + 4k}{3} = \\frac{2 + 3k}{2}\\]\n",
      "\n",
      "Solving for k, we get:\n",
      "\n",
      "\\[6 + 24k = 6 + 9k\\]\n",
      "\n",
      "\\[15k = 0\\]\n",
      "\n",
      "\\[k = 0\\]\n",
      "\n",
      "Substituting k = 0 into the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + 0 \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix}\\]\n",
      "\n",
      "\\[= \\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix}\\]\n",
      "\n",
      "So, the point P is (1,1,1).\n",
      "\n",
      "This is not possible, since P is the intersection point of the two lines.\n",
      "\n",
      "So, we must have k ≠ 0.\n",
      "\n",
      "Substituting k ≠ 0 into the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix}\\]\n",
      "\n",
      "Equating this with the equation of the line defined by the vector (-2,3,-1), we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + k \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix} = \\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]\n",
      "\n",
      "Equating the x, y, and z components, we get:\n",
      "\n",
      "\\[1 + 4k = -2 + s\\]\n",
      "\\[1 + 6k = 3 + 2s\\]\n",
      "\\[1 + 8k = -1 + 4s\\]\n",
      "\n",
      "Solving for s, we get:\n",
      "\n",
      "\\[s = \\frac{3 + 4k}{3}\\]\n",
      "\\[s = \\frac{2 + 3k}{2}\\]\n",
      "\\[s = \\frac{2 + 2k}{4}\\]\n",
      "\n",
      "Equating the values of s from the first two equations, we get:\n",
      "\n",
      "\\[\\frac{3 + 4k}{3} = \\frac{2 + 3k}{2}\\]\n",
      "\n",
      "Solving for k, we get:\n",
      "\n",
      "\\[6 + 24k = 6 + 9k\\]\n",
      "\n",
      "\\[15k = 0\\]\n",
      "\n",
      "This is a contradiction, since we assumed k ≠ 0.\n",
      "\n",
      "So, we must have k = 0.\n",
      "\n",
      "Substituting k = 0 into the equation of the line l, we get:\n",
      "\n",
      "\\[\\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix} + 0 \\begin{pmatrix} 4 \\\\ 6 \\\\ 8 \\end{pmatrix}\\]\n",
      "\n",
      "\\[= \\begin{pmatrix} 1 \\\\ 1 \\\\ 1 \\end{pmatrix}\\]\n",
      "\n",
      "So, the point P is (1,1,1).\n",
      "\n",
      "This is not possible, since P is the intersection point of the two lines.\n",
      "\n",
      "However, we can find the point Q by using the parametric equation of the line defined by the vector (-2,3,-1).\n",
      "\n",
      "The point Q is given by the vector (-2,3,-1) + s(1,2,4).\n",
      "\n",
      "So, the point Q is (-2 + s, 3 + 2s, -1 + 4s).\n",
      "\n",
      "The point Q must also lie on the line defined by the vector (2,3,4).\n",
      "\n",
      "So, we can write the equation of the line defined by the vector (2,3,4) as:\n",
      "\n",
      "\\[\\begin{pmatrix} 2 \\\\ \n",
      "------------CodeNL-------------\n",
      "i: 0\n",
      "codenl_answer: 75\n",
      "codenl is correct: False\n",
      "codenl_rp: python\n",
      "from sympy import symbols, Matrix, Eq, solve\n",
      "\n",
      "def solution():\n",
      "    \"\"\"A line passing through the point $(1,1,1)$ intersects the line defined by\n",
      "    \\[\\begin{pmatrix} 1 \\\\ 2 \\\\ 3 \\end{pmatrix} + t \\begin{pmatrix} 2 \\\\ 3 \\\\ 4 \\end{pmatrix}\\]\n",
      "    at $P,$ and intersects the line defined by\n",
      "    \\[\\begin{pmatrix} -2 \\\\ 3 \\\\ -1 \\end{pmatrix} + s \\begin{pmatrix} 1 \\\\ 2 \\\\ 4 \\end{pmatrix}\\]\n",
      "    at $Q.$  Find point $Q.$\"\"\"\n",
      "    x, y, z = symbols('x y z')\n",
      "    t = symbols('t')\n",
      "    s = symbols('s')\n",
      "\n",
      "    # Define the parametric equations for the lines\n",
      "    P = Matrix([1, 1, 1]) + t * Matrix([2, 3, 4])\n",
      "    Q = Matrix([-2, 3, -1]) + s * Matrix([1, 2, 4])\n",
      "\n",
      "    # Equate the x, y, and z coordinates of the two points\n",
      "    eq1 = Eq(P[0], Q[0])\n",
      "    eq2 = Eq(P[1], Q[1])\n",
      "    eq3 = Eq(P[2], Q[2])\n",
      "\n",
      "    # Solve the system of equations for s and t\n",
      "    sol = solve((eq1, eq2, eq3), (s, t))\n",
      "\n",
      "    # Substitute the values of s and t into the equation for Q\n",
      "    Q = Matrix([-2, 3, -1]) + sol[s] * Matrix([1, 2, 4])\n",
      "    result = Q\n",
      "    return result\n",
      "\n",
      "To find the point Q, we need to find the values of s and t that make the two lines intersect. We can do this by equating the coordinates of the two points P and Q.\n",
      "\n",
      "Step-by-step reasoning:\n",
      "1. The parametric equations for the lines are:\n",
      "   - Line 1: \\( P = (1, 1, 1) + t(2, 3, 4) = (1 + 2t, 1 + 3t, 1 + 4t) \\)\n",
      "   - Line 2: \\( Q = (-2, 3, -1) + s(1, 2, 4) = (-2 + s, 3 + 2s, -1 + 4s) \\)\n",
      "\n",
      "2. Since the lines intersect, the coordinates of P and Q are the same. We can equate the x, y, and z coordinates of the two points:\n",
      "   - \\( 1 + 2t = -2 + s \\)\n",
      "   - \\( 1 + 3t = 3 + 2s \\)\n",
      "   - \\( 1 + 4t = -1 + 4s \\)\n",
      "\n",
      "3. We can solve this system of equations for s and t. Subtracting the first equation from the second equation, we get:\n",
      "   - \\( 3t - 2s = 4 \\)\n",
      "\n",
      "   Subtracting the first equation from the third equation, we get:\n",
      "   - \\( 4t - 3s = 2 \\)\n",
      "\n",
      "4. We can solve this system of equations using substitution or elimination. Let's use elimination. Multiplying the first equation by 3 and the second equation by 2, we get:\n",
      "   - \\( 9t - 6s = 12 \\)\n",
      "   - \\( 8t - 6s = 4 \\)\n",
      "\n",
      "   Subtracting the second equation from the first equation, we get:\n",
      "   - \\( t = 8 \\)\n",
      "\n",
      "5. Substituting t = 8 into one of the original equations, we can solve for s. Let's use the first equation:\n",
      "   - \\( 1 + 2(8) = -2 + s \\)\n",
      "   - \\( 17 = -2 + s \\)\n",
      "   - \\( s = 19 \\)\n",
      "\n",
      "6. Now that we have the values of s and t, we can substitute them into the equation for Q:\n",
      "   - \\( Q = (-2, 3, -1) + 19(1, 2, 4) \\)\n",
      "   - \\( Q = (-2 + 19, 3 + 38, -1 + 76) \\)\n",
      "   - \\( Q = (17, 41, 75) \\)\n",
      "\n",
      "Therefore, the final answer is:\n",
      "\\[oxed{(17, 41, 75)} \\]\n"
     ]
    }
   ],
   "source": [
    "i = 0\n",
    "\n",
    "print('i:', i)\n",
    "sample = data[i]\n",
    "print('subset:', sample['subset'])\n",
    "print('idx:', sample['idx'])\n",
    "print('question:', sample['question'])\n",
    "print('ground_truth:', sample['ground_truth'])\n",
    "\n",
    "print('------------COT-------------')\n",
    "print('i:', i)\n",
    "if sample['cot_answer'] == '':\n",
    "    print('when running PAL, execution failed!')\n",
    "else:\n",
    "    print('cot_answer:', sample['cot_answer'])\n",
    "print('cot_rp:', sample['cot_rp'].replace('```', ''))\n",
    "\n",
    "# flag = input('Press enter to continue')\n",
    "# if flag == 'q':\n",
    "#     break\n",
    "\n",
    "print('------------CodeNL-------------')\n",
    "print('i:', i)\n",
    "if sample['codenl_answer'] == '':\n",
    "    print('when running NLCode, execution failed!')\n",
    "else:\n",
    "    print('codenl_answer:', sample['codenl_answer'])\n",
    "print('codenl is correct:', sample['codenl_correct'])\n",
    "print('codenl_rp:', sample['codenl_rp'].replace('```', ''))\n",
    "# print('nlcode_rp:', sample['nlcode_rp'])\n",
    "# flag = input('Press enter to continue')\n",
    "# if flag == 'q':\n",
    "#     break    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## One right one wrong"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {},
   "outputs": [],
   "source": [
    "right = 'nlcode'\n",
    "wrong = 'cot'\n",
    "\n",
    "file = 'analysis/gpt-4o-mini_{right}_correct_{wrong}_wrong.json'.format(right=right, wrong=wrong)\n",
    "data = json.load(open(file))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 8\n",
      "subset: algebra\n",
      "idx: 1109\n",
      "question: Diana can either invest $20,\\!000$ dollars for $4$ years with a simple interest rate of $6\\%$ or an interest rate of $7\\%$ which compounds quarterly. How many more dollars, rounded to the nearest dollar, would she get with the better interest rate than with the worse one?\n",
      "ground_truth: 1599\n",
      "------------correct method-------------\n",
      "i: 8\n",
      "nlcode method is correct\n",
      "nlcode_answer: 1599\n",
      "nlcode_rp: Let's think step by step.\n",
      "\n",
      "1. **Calculating the simple interest for the first investment**:\n",
      "   - Principal amount \\( P = 20000 \\) dollars.\n",
      "   - Interest rate \\( r = 0.06 \\) (6%).\n",
      "   - Time \\( t = 4 \\) years.\n",
      "   - The formula for simple interest is given by:\n",
      "     \\[\n",
      "     A = P(1 + rt)\n",
      "     \\]\n",
      "   - Substituting the values:\n",
      "     \\[\n",
      "     A = 20000 \\left(1 + 0.06 \\cdot 4\\right) = 20000 \\left(1 + 0.24\\right) = 20000 \\cdot 1.24 = 24800\n",
      "     \\]\n",
      "\n",
      "2. **Calculating the compound interest for the second investment**:\n",
      "   - Principal amount \\( P = 20000 \\) dollars.\n",
      "   - Interest rate \\( r = 0.07 \\) (7%).\n",
      "   - Compounding quarterly means \\( n = 4 \\) (number of times interest applied per year).\n",
      "   - Time \\( t = 4 \\) years.\n",
      "   - The formula for compound interest is:\n",
      "     \\[\n",
      "     A = P \\left(1 + \\frac{r}{n}\\right)^{nt}\n",
      "     \\]\n",
      "   - Substituting the values:\n",
      "     \\[\n",
      "     A = 20000 \\left(1 + \\frac{0.07}{4}\\right)^{4 \\cdot 4} = 20000 \\left(1 + 0.0175\\right)^{16}\n",
      "     \\]\n",
      "     \\[\n",
      "     = 20000 \\left(1.0175\\right)^{16}\n",
      "     \\]\n",
      "\n",
      "3. **Calculating \\( (1.0175)^{16} \\)**:\n",
      "   - Using the binomial expansion or calculating directly, we find:\n",
      "     \\[\n",
      "     (1.0175)^{16} \\approx 1.348850\n",
      "     \\]\n",
      "   - Therefore, the amount after 4 years is:\n",
      "     \\[\n",
      "     A \\approx 20000 \\times 1.348850 \\approx 26977\n",
      "     \\]\n",
      "\n",
      "4. **Calculating the difference**:\n",
      "   - Now, we find the difference between the two amounts:\n",
      "     \\[\n",
      "     \\text{Difference} = 26977 - 24800 = 1977\n",
      "     \\]\n",
      "\n",
      "Thus, the amount Diana would get with the better interest rate compared to the worse one is \\(\\boxed{1977}\\).\n",
      "python\n",
      "from sympy import Rational\n",
      "\n",
      "def solution():\n",
      "    # Simple interest calculation\n",
      "    P = 20000  # Principal amount in dollars\n",
      "    r1 = Rational(6, 100)  # Simple interest rate (6%)\n",
      "    t = 4  # Time in years\n",
      "    \n",
      "    # Amount with simple interest\n",
      "    A_simple = P * (1 + r1 * t)\n",
      "    \n",
      "    # Compound interest calculation\n",
      "    r2 = Rational(7, 100)  # Compound interest rate (7%)\n",
      "    n = 4  # Compounded quarterly\n",
      "    # Amount with compound interest\n",
      "    A_compound = P * (1 + r2 / n)**(n * t)\n",
      "    \n",
      "    # Calculate the difference\n",
      "    difference = A_compound - A_simple\n",
      "    \n",
      "    return round(difference)\n",
      "\n",
      "\n",
      "------------wrong method-------------\n",
      "i: 8\n",
      "cot method is wrong\n",
      "cot_answer: 1977\n",
      "cot_rp: Let's think step by step.\n",
      "\n",
      "1. **Calculate the amount from the simple interest investment at 6% for 4 years.**\n",
      "   The formula for simple interest is:\n",
      "   \\[\n",
      "   A = P(1 + rt)\n",
      "   \\]\n",
      "   where \\( P \\) is the principal, \\( r \\) is the rate, and \\( t \\) is the time in years.\n",
      "   Here, \\( P = 20000 \\), \\( r = 0.06 \\), and \\( t = 4 \\):\n",
      "   \\[\n",
      "   A = 20000(1 + 0.06 \\cdot 4) = 20000(1 + 0.24) = 20000 \\cdot 1.24 = 24800.\n",
      "   \\]\n",
      "\n",
      "2. **Calculate the amount from the compound interest investment at 7% compounded quarterly.**\n",
      "   The formula for compound interest is:\n",
      "   \\[\n",
      "   A = P\\left(1 + \\frac{r}{n}\\right)^{nt}\n",
      "   \\]\n",
      "   where \\( P \\) is the principal, \\( r \\) is the annual interest rate, \\( n \\) is the number of times the interest is compounded per year, and \\( t \\) is the time in years.\n",
      "   Here, \\( P = 20000 \\), \\( r = 0.07 \\), \\( n = 4 \\), and \\( t = 4 \\):\n",
      "   \\[\n",
      "   A = 20000\\left(1 + \\frac{0.07}{4}\\right)^{4 \\cdot 4} = 20000\\left(1 + 0.0175\\right)^{16} = 20000(1.0175)^{16}.\n",
      "   \\]\n",
      "   Now we calculate \\( (1.0175)^{16} \\):\n",
      "   \\[\n",
      "   (1.0175)^{16} \\approx 1.348850.\n",
      "   \\]\n",
      "   Thus,\n",
      "   \\[\n",
      "   A \\approx 20000 \\cdot 1.348850 \\approx 26977.\n",
      "   \\]\n",
      "\n",
      "3. **Calculate the difference between the two amounts.**\n",
      "   The difference is:\n",
      "   \\[\n",
      "   26977 - 24800 = 1977.\n",
      "   \\]\n",
      "\n",
      "Therefore, the answer is:\n",
      "\\[\n",
      "\\boxed{1977}\n",
      "\\]\n"
     ]
    }
   ],
   "source": [
    "i = 0 # 0~19\n",
    "i = 8\n",
    "print('i:', i)\n",
    "sample = data[i]\n",
    "print('subset:', sample['subset'])\n",
    "print('idx:', sample['idx'])\n",
    "print('question:', sample['question'])\n",
    "print('ground_truth:', sample['ground_truth'])\n",
    "\n",
    "print('------------correct method-------------')\n",
    "print('i:', i)\n",
    "print(f'{right} method is correct'.format(right=right))\n",
    "print(f'{right}_answer:', sample[f'{right}_answer'])\n",
    "print(f'{right}_rp:', sample[f'{right}_rp'].replace('```', ''))\n",
    "\n",
    "\n",
    "# flag = input('Press enter to continue')\n",
    "# if flag == 'q':\n",
    "#     break\n",
    "\n",
    "print('------------wrong method-------------')\n",
    "print('i:', i)\n",
    "print(f'{wrong} method is wrong'.format(wrong=wrong))\n",
    "print(f'{wrong}_answer:', sample[f'{wrong}_answer'])\n",
    "print(f'{wrong}_rp:', sample[f'{wrong}_rp'].replace('```', ''))\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Method cot done\n",
      "Method pal done\n",
      "Method codenl done\n",
      "Method nlcode done\n"
     ]
    }
   ],
   "source": [
    "from reasoner import retrieve_answer_math\n",
    "\n",
    "model = 'gpt-4o-mini'\n",
    "data = retrieve_answer_math(model)\n",
    "\n",
    "method_1 = 'pal'\n",
    "method_2 = 'nlcode'\n",
    "method_3 = 'codenl'\n",
    "\n",
    "subset = 'algebra'\n",
    "idx = 708"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "What is the domain of the real-valued function $$q(x) = \\frac{\\sqrt{x}}{\\sqrt{1-x^2}}~?$$Express your answer as an interval or as a union of intervals.\n"
     ]
    }
   ],
   "source": [
    "print(data[method_1][subset][idx]['question'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------pal-------------\n",
      "correct: False\n",
      "answer: Interval(0, 1)\n",
      "rp: python\n",
      "from sympy import symbols, sqrt, Interval, S\n",
      "\n",
      "def solution():\n",
      "    \"\"\"What is the domain of the real-valued function $$q(x) = \\frac{\\sqrt{x}}{\\sqrt{1-x^2}}~?$$ Express your answer as an interval or as a union of intervals.\"\"\"\n",
      "    x = symbols('x')\n",
      "    \n",
      "    # Conditions for the function to be defined:\n",
      "    # 1. sqrt(x) is defined: x >= 0\n",
      "    # 2. sqrt(1 - x^2) is defined: 1 - x^2 > 0 => -1 < x < 1\n",
      "    \n",
      "    # Combine the intervals\n",
      "    domain = Interval(0, 1)  # Since x has to be non-negative and less than 1\n",
      "    \n",
      "    return domain\n",
      "\n"
     ]
    }
   ],
   "source": [
    "print('------------{method_1}-------------'.format(method_1=method_1))\n",
    "print('correct:', data[method_1][subset][idx]['correct'])\n",
    "print('answer:', data[method_1][subset][idx]['answer'])\n",
    "print('rp:', data[method_1][subset][idx]['reasoning_path'].replace('```', ''))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------nlcode-------------\n",
      "correct: False\n",
      "answer: \n",
      "rp: Let's think step by step about the function \\( q(x) = \\frac{\\sqrt{x}}{\\sqrt{1-x^2}} \\).\n",
      "\n",
      "1. **Identify the constraints from the numerator**: The expression \\(\\sqrt{x}\\) is defined for \\(x \\geq 0\\). Therefore, we have:\n",
      "   \\[\n",
      "   x \\geq 0.\n",
      "   \\]\n",
      "\n",
      "2. **Identify the constraints from the denominator**: The expression \\(\\sqrt{1-x^2}\\) is defined when \\(1-x^2 > 0\\). This simplifies to:\n",
      "   \\[\n",
      "   1 > x^2 \\quad \\Rightarrow \\quad -1 < x < 1.\n",
      "   \\]\n",
      "\n",
      "3. **Combine the constraints**: We need both conditions to hold:\n",
      "   - From the numerator: \\(x \\geq 0\\)\n",
      "   - From the denominator: \\(-1 < x < 1\\)\n",
      "\n",
      "   Combining these, we find:\n",
      "   \\[\n",
      "   0 \\leq x < 1.\n",
      "   \\]\n",
      "\n",
      "Thus, the domain of the function \\( q(x) \\) is:\n",
      "\\[\n",
      "[0, 1).\n",
      "\\]\n",
      "\n",
      "The final answer is \\(\\boxed{[0, 1)}\\).\n",
      "python\n",
      "from sympy import S\n",
      "\n",
      "def solution():\n",
      "    # The domain of the function q(x) = sqrt(x) / sqrt(1 - x^2)\n",
      "    # is derived from the constraints identified in the reasoning.\n",
      "    domain = S.Reals.intersect(S.Interval(0, 1, True, False))\n",
      "    return domain\n",
      "\n",
      "\n"
     ]
    }
   ],
   "source": [
    "print('------------{method_2}-------------'.format(method_2=method_2))\n",
    "\n",
    "print('correct:', data[method_2][subset][idx]['correct'])\n",
    "print('answer:', data[method_2][subset][idx]['answer'])\n",
    "print('rp:', data[method_2][subset][idx]['reasoning_path'].replace('```', ''))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "------------codenl-------------\n",
      "correct: True\n",
      "answer: [0,1)\n",
      "rp: python\n",
      "from sympy import symbols, sqrt, Interval, S\n",
      "\n",
      "def solution():\n",
      "    \"\"\"What is the domain of the real-valued function $$q(x) = \\frac{\\sqrt{x}}{\\sqrt{1-x^2}}~?$$ Express your answer as an interval or as a union of intervals.\"\"\"\n",
      "    x = symbols('x')\n",
      "    \n",
      "    # Determine the conditions for the function to be defined\n",
      "    condition1 = x >= 0  # sqrt(x) is defined for x >= 0\n",
      "    condition2 = 1 - x**2 > 0  # sqrt(1 - x^2) is defined for 1 - x^2 > 0\n",
      "    \n",
      "    # From condition2, we have -1 < x < 1\n",
      "    interval1 = Interval(0, 1)  # x must be >= 0 and < 1\n",
      "    \n",
      "    # The domain is [0, 1)\n",
      "    result = interval1\n",
      "    return result\n",
      "\n",
      "To determine the domain of the real-valued function \n",
      "\n",
      "\\[\n",
      "q(x) = \\frac{\\sqrt{x}}{\\sqrt{1-x^2}},\n",
      "\\]\n",
      "\n",
      "we need to analyze the conditions under which the function is defined.\n",
      "\n",
      "1. **Condition for the numerator**: The square root in the numerator, \\(\\sqrt{x}\\), is defined for \\(x \\geq 0\\).\n",
      "\n",
      "2. **Condition for the denominator**: The square root in the denominator, \\(\\sqrt{1-x^2}\\), is defined when \\(1 - x^2 > 0\\). This can be rewritten as:\n",
      "   \\[\n",
      "   1 > x^2 \\quad \\Rightarrow \\quad -1 < x < 1.\n",
      "   \\]\n",
      "\n",
      "3. **Combining conditions**: \n",
      "\n",
      "   - From the first condition, we have \\(x \\geq 0\\).\n",
      "   - From the second condition, we have \\(-1 < x < 1\\).\n",
      "\n",
      "   The valid range of \\(x\\) that satisfies both conditions is:\n",
      "   \\[\n",
      "   0 \\leq x < 1.\n",
      "   \\]\n",
      "\n",
      "Thus, the domain of the function \\(q(x)\\) can be expressed as the interval:\n",
      "\n",
      "\\[\n",
      "[0, 1).\n",
      "\\]\n",
      "\n",
      "Therefore, the final result is:\n",
      "\n",
      "\\[\n",
      "\\boxed{[0, 1)}\n",
      "\\]\n"
     ]
    }
   ],
   "source": [
    "\n",
    "print('------------{method_3}-------------'.format(method_3=method_3))\n",
    "\n",
    "print('correct:', data[method_3][subset][idx]['correct'])\n",
    "print('answer:', data[method_3][subset][idx]['answer'])\n",
    "print('rp:', data[method_3][subset][idx]['reasoning_path'].replace('```', ''))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "textgen",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
