{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "39d46115-4eb0-48ba-ba15-b0e80741ee9c",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "import csv\n",
    "import re\n",
    "ds = json.load(open('/home/XXXX/XXXX/SAT-LM/data/proofd5_test.json', 'r'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "574d9bd7-244c-4ae9-ad3e-83fa5fdd8aec",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "4e5182f1-5912-4546-94bc-0bc4e5ee6299",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'example_id': 22, 'premises': 'Miroslav Venhoda was a Czech choir instructor who specialized in the performance of Renaissance and Baroque music.\\nAny choral conductor is a musician.\\nSome musicians love music.\\nMiroslav Venhoda published a book in 1946 called Method of Studying Gregorian Chant.', 'conclusion': 'No choral conductor specialized in the performance of Renaissance.', 'premises-FOL': 'Czech(miroslav) ∧ ChoirInstructor(miroslav) ∧ SpecializeInPerformanceOf(miroslav, renaissanceMusic) ∧ SpecializeInPerformanceOf(miroslav, baroqueMusic)\\n∀x (ChoralConductor(x) → Musician(x))\\n∃x ∃y ((Musician(x) → Love(x, music)) \\nPublishedBook(miroslav, methodOfStudyingGregorianChant, yr1946)', 'conclusion-FOL': '∀x (ChoralConductor(x) → ¬SpecializeInPerformanceOf(x, renaissanceMusic))', 'label': 'false'}\n"
     ]
    }
   ],
   "source": [
    "print(ds[5])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "id": "485c91bf-fa1c-47be-82b5-e5d94780d092",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'1 sep 2012 I went out on and it was better than 15 jan 2012'"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "s = \"I went out on 1 sep 2012 and it was better than 15 jan 2012\"\n",
    "r = re.compile('(.*)(1 sep 2012 )(.*)')\n",
    "r.sub(r'\\2\\1\\3',s)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "7be80115-051a-4e2f-9075-c876ffab03c7",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "CargoShip(britta) ∧ Ship(britta) ∧ BuiltFor(britta, norwegians)\n",
      "ImpressedIntoServiceBy(britta, germany)\n",
      "∀x ∀y (Ship(x) ∧ ImpressedIntoServiceBy(x, y) → SeizedBy(x, y))\n",
      "SoldTo(britta, hongkong)\n",
      "∀x ∀y (SoldTo(x, hongkong) → ¬SeizedBy(x, y))\n",
      "--------------\n",
      "→  (Ship(x) ∧ ImpressedIntoServiceBy(x, y) → SeizedBy(x, y\n",
      "→  (SoldTo(x, hongkong) → ¬SeizedBy(x, y\n",
      "¬  (SoldTo(x, hongkong) → ¬SeizedBy(x, y\n",
      "['x', 'y'] ['britta', 'norwegians', 'germany', 'y', 'hongkong'] ['cargo_ship', 'ship', 'built_for', 'impressed_into_service_by', 'seized_by', 'sold_to']\n",
      "And(cargo_ship(britta), ship(britta), built_fOr(britta, norwegians))\n",
      "impressed_into_service_by(britta, germany)\n",
      "ForAll([x,y], Implies(And((ship(x), impressed_into_service_by(x, y)), seized_by(x, y))\n",
      "sold_to(britta, hongkong)\n",
      "ForAll([x,y], Implies((sold_to(x, hongkong), ¬seized_by(x, y))\n"
     ]
    }
   ],
   "source": [
    "import re\n",
    "\n",
    "# Function to convert first-order logic to desired format\n",
    "def convert_to_target_format(logic_str):\n",
    "    # Replace universal quantifier ∀x with ForAll([x], ...)\n",
    "    const = []\n",
    "    \n",
    "    if '∀' in logic_str:\n",
    "        for z in logic_str.split('∀'):\n",
    "            # print(z)\n",
    "            if len(z) == 0: continue\n",
    "            # print(z[0])\n",
    "            if z[0] not in const:\n",
    "                const.append(z[0])\n",
    "\n",
    "    # print(const)\n",
    "    # print(const)\n",
    "    for c in const:\n",
    "        logic_str = logic_str.replace('∀' + c, '').strip(' ')[1:-1]\n",
    "    \n",
    "    # print(logic_str)\n",
    "    r = re.compile(\"¬([^\\(][^ ][^\\)]*\\))\")\n",
    "    old_logic=logic_str\n",
    "    logic_str = r.sub(r\"Not(\\1)\", logic_str)\n",
    "    # print('look here:', logic_str)\n",
    "    # print(logic_str)\n",
    "    # print(old_logic)\n",
    "    while old_logic != logic_str:\n",
    "        # r = re.compile(\"¬([^\\(][^ ][.^\\(]*\\))\")\n",
    "        old_logic=logic_str\n",
    "        logic_str = r.sub(r\"Not(\\1)\", logic_str)\n",
    "        # print(logic_str)\n",
    "        # print(old_logic)\n",
    "    \n",
    "    last_op = ''\n",
    "    consec_or = 1\n",
    "    consec_and = 1\n",
    "    tmp_or = 1\n",
    "    tmp_and = 1\n",
    "    ops = ['∨', '∧', '¬', '→', '⊕']\n",
    "    for c in logic_str:\n",
    "        # print(c)\n",
    "        if c == '∨':\n",
    "            if last_op == '∨':\n",
    "                tmp_or += 1\n",
    "            last_op = '∨'\n",
    "            # print(last_op, c, last_op == c)\n",
    "        elif c in ops and c != '∨':\n",
    "            tmp_or = 1\n",
    "            last_op = ''\n",
    "            if consec_or < tmp_or: consec_or = temp_or\n",
    "            # print(c)\n",
    "    if consec_or < tmp_or: consec_or = temp_or\n",
    "\n",
    "    last_op = ''\n",
    "    for c in logic_str:\n",
    "        if c == '∧':\n",
    "            if last_op == '∧':\n",
    "                tmp_and += 1\n",
    "                # print(c, logic_str)\n",
    "\n",
    "            last_op = '∧'\n",
    "            \n",
    "        elif c in ops and c != '∧':\n",
    "            consec_and = 1\n",
    "            last_op = ''\n",
    "            if consec_and < tmp_and: consec_and = tmp_and\n",
    "            print(c, logic_str)\n",
    "    if consec_and < tmp_and: consec_and = tmp_and\n",
    "\n",
    "    rstr = ''\n",
    "    # print(consec_and)\n",
    "    if consec_and > 1:\n",
    "        for m in range(consec_and+1):\n",
    "            rstr += '([^ ]*\\([^\\(]*\\)) ∧ '\n",
    "        rstr = rstr[:-3]\n",
    "        r = re.compile(rstr)\n",
    "        rsubstr = r'And('\n",
    "        for m in range(1,1+1+consec_and):\n",
    "            rsubstr += '\\\\' + str(m) + ', '\n",
    "        rsubstr = rsubstr[:-2] + ')'\n",
    "        # logic_str = r.sub(r\n",
    "        logic_str = r.sub(rsubstr, logic_str)\n",
    "        # print(rsubstr)\n",
    "    if consec_or > 1:\n",
    "        for m in range(consec_or+1):\n",
    "            rstr += '([^ ]*\\([^\\(]*\\)) ∨ '\n",
    "        rstr = rstr[:-3]\n",
    "        r = re.compile(rstr)\n",
    "        rsubstr = r'Or('\n",
    "        for m in range(1, 1+1+consec_or):\n",
    "            rsubstr += '\\\\' + str(m) + ', '\n",
    "        rsubstr = rsubstr[:-2] + ')'\n",
    "        # logic_str = r.sub(r\n",
    "        logic_str = r.sub(rsubstr, logic_str)\n",
    "        # print(rsubstr)\n",
    "    # print(consec_or)\n",
    "    # Replace conjunction (∧) with And\n",
    "    # print(logic_str)\n",
    "    r = re.compile(\"¬\\(([^ ]*\\([^\\(]*\\)) ∨ ([^ ]*\\([^\\(^)]*\\))\\)\")\n",
    "    logic_str = r.sub(r\"Not(Or(\\1, \\2))\", logic_str)\n",
    "    \n",
    "    r = re.compile(\"([^ ]*\\([^\\(]*\\)) ∨ ([^ ]*\\([^\\(]*\\))\")\n",
    "\n",
    "    logic_str = r.sub(r\"Or(\\1, \\2)\", logic_str)    \n",
    "\n",
    "    r = re.compile(\"¬\\(([^ ]*\\([^\\(]*\\)) ∧ ([^ ]*\\([^\\(^)]*\\))\\)\")\n",
    "    logic_str = r.sub(r\"Not(And(\\1, \\2))\", logic_str)\n",
    "    \n",
    "    r = re.compile(\"([^ ]*\\([^\\(]*\\)) ∧ ([^ ]*\\([^\\(]*\\))\")\n",
    "    logic_str = r.sub(r\"And(\\1, \\2)\", logic_str).replace('And ', 'And')\n",
    "\n",
    "    \n",
    "    r = re.compile(\"¬\\(([^ ]*\\([^\\(]*\\)) ⊕ ([^ ]*\\([^\\(^)]*\\))\\)\")\n",
    "    logic_str = r.sub(r\"Not(Xor(\\1, \\2))\", logic_str)\n",
    "\n",
    "    r = re.compile(\"^(Not\\([^ ]*\\([^\\(]*\\)\\)) ⊕ (Not\\([^ ]*\\([^\\(^)]*\\)\\))$\")\n",
    "    logic_str = r.sub(r\"Xor(\\1, \\2)\", logic_str)\n",
    "    \n",
    "    r = re.compile(\"^(Not\\([^ ]*\\([^\\(]*\\)\\)) ⊕ ([^ ]*\\([^\\(^)]*\\))$\")\n",
    "    logic_str = r.sub(r\"Xor(\\1, \\2)\", logic_str)\n",
    "\n",
    "    \n",
    "    r = re.compile(\"^([^ ]*\\([^\\(]*\\)) ⊕ (Not\\([^ ]*\\([^\\(^)]*\\)\\))$\")\n",
    "    logic_str = r.sub(r\"Xor(\\1, \\2)\", logic_str)\n",
    "\n",
    "    r = re.compile(\"^([^ ]*\\([^\\(]*\\)) ⊕ ([^ ]*\\([^\\(^)]*\\))$\")\n",
    "    logic_str = r.sub(r\"Xor(\\1, \\2)\", logic_str)\n",
    "\n",
    "    r = re.compile(\"→ ([^ ]*\\([^\\(]*\\)) ⊕ ([^ ]*\\([^\\(^)]*\\))$\")\n",
    "    logic_str = r.sub(r\"→ Xor(\\1, \\2)\", logic_str)\n",
    "    \n",
    "    r = re.compile(\"\\(([^ ]*\\([^\\(]*\\)) ⊕ ([^ ]*\\([^\\(^)]*\\))\\)\")\n",
    "    logic_str = r.sub(r\"Xor(\\1, \\2)\", logic_str)\n",
    "\n",
    "    # r = re.compile(\"¬\\((.*)\\)\")\n",
    "\n",
    "    # logic_str = r.sub(r\"Not(\\1)\", logic_str)\n",
    "\n",
    "    r = re.compile(\"(.*)→(.*)\")\n",
    "    logic_str = r.sub(r\"Implies(\\1, \\2)\", logic_str).replace(' ,', ',').replace('  ', ' ')\n",
    "    \n",
    "    # logic_str = re.sub(r\"∀x\", \"ForAll([x],\", logic_str)\n",
    "    \n",
    "    # Replace implication (→) with Implies\n",
    "    \n",
    "    \n",
    "    # Replace negation (¬) with Not\n",
    "\n",
    "    \n",
    "    \n",
    "    # Replace disjunction (∨) with Or\n",
    "  \n",
    "    # Make predicates lowercase for consistency\n",
    "    # logic_str = re.sub(r\"\\b(Eel|Fish|Tree|DisplayedIn|Plant|LivingCreature|ComplexCell|Bacteria|Animal|Multicellular|ShownIn|seaSnake|seaEel)\\b\", lambda m: m.group(0).lower(), logic_str)\n",
    "    old_logic_str = logic_str\n",
    "    r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "    logic_str = r.sub(r\"\\1\\2_\\3\\4\", logic_str)\n",
    " \n",
    "    while old_logic_str != logic_str:\n",
    "        old_logic_str = logic_str\n",
    "        r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "        logic_str = r.sub(r\"\\1\\2_\\3\\4\", logic_str)\n",
    "        \n",
    "\n",
    "    \n",
    "    # Handle cases where functions or predicates are followed by variables\n",
    "    logic_str = re.sub(r\"([a-zA-Z]+)\\((\\w+)\\)\", r\"\\1(\\2)\", logic_str)\n",
    "    if len(const) != 0:\n",
    "        new_str = 'ForAll(['\n",
    "        for c in const:\n",
    "            new_str += c + ','\n",
    "        logic_str = new_str[:-1] + '], ' + logic_str + ')'\n",
    "    # if 'Implies' in logic_str:\n",
    "        # logic_str = logic_str.replace('Implies(', 'Implies')[:-1]\n",
    "    return logic_str.replace('( ', '(').replace(' (', '(')\n",
    "def extract_predicates_and_objects(logic_str):\n",
    "    # Regex to match predicates and objects inside parentheses\n",
    "    predicate_pattern = r\"([a-zA-Z]+)\\(([^)]+)\\)\"\n",
    "    \n",
    "    # Find all matches\n",
    "    matches = re.findall(predicate_pattern, logic_str)\n",
    "    \n",
    "    extracted = []\n",
    "    \n",
    "    # Process the matches to separate predicate and objects\n",
    "    for predicate, objects in matches:\n",
    "        object_list = objects.split(\",\")  # Split objects by comma if there are multiple\n",
    "        extracted.append((predicate, object_list))\n",
    "    \n",
    "    return extracted\n",
    "\n",
    "\n",
    "# for d in ds:\n",
    "#     if d['example_id'] == 1337:\n",
    "#         logic_statements = d['premises-FOL'].split('\\n') + [d['conclusion-FOL']]\n",
    "#         for z in d['premises-FOL'].split('\\n'):\n",
    "#             print(z)\n",
    "d = ds[499]\n",
    "logic_statements = d['premises-FOL'].split('\\n') + [d['conclusion-FOL']]\n",
    "space_ops = ['∧', '⊕', '∨']\n",
    "\n",
    "for s in range(len(logic_statements)):\n",
    "    logic_statements[s] = logic_statements[s].replace('  ', ' ')\n",
    "    statement = logic_statements[s]\n",
    "    c = 0\n",
    "    while c < (len(logic_statements[s])):\n",
    "        # print(logic_statements[s])\n",
    "        # if namecounter == 1:\n",
    "        #     breakpoint()\n",
    "        if logic_statements[s][c] in space_ops:\n",
    "            # breakpoint()\n",
    "            if logic_statements[s][c-1] != ' ':\n",
    "                logic_statements[s] = logic_statements[s][:c] + ' ' + logic_statements[s][c:]\n",
    "                # breakpoint()\n",
    "            if logic_statements[s][c+1] != ' ':\n",
    "                logic_statements[s] = logic_statements[s][:c+2] + ' ' + logic_statements[s][c+2:]\n",
    "                # breakpoint()\n",
    "        c += 1\n",
    "for statement in logic_statements:\n",
    "    print(statement)\n",
    "print('--------------')\n",
    "predicates = []\n",
    "entities = []\n",
    "arity = {}\n",
    "# print(logic_statements)\n",
    "# logic_statements.append('∀x (DisplayedIn(x, collection) → ¬(Plant(x) ⊕ LivingCreature(x)))')\n",
    "\n",
    "\n",
    "    # print(\"-\" * 50)\n",
    "# print(entities, predicates)\n",
    "const = []\n",
    "\n",
    "\n",
    "            \n",
    "# print(const)\n",
    "\n",
    "converted_statements = [convert_to_target_format(statement) for statement in logic_statements]\n",
    "for statement in converted_statements:\n",
    "    if 'ForAll' in statement:\n",
    "        consts = statement.split('ForAll([')[1].split(']')[0].split(',')\n",
    "        # print('yeah')\n",
    "        for c in consts:\n",
    "            if c not in const: const.append(c)\n",
    "# print(const)\n",
    "for statement in logic_statements:\n",
    "    extracted = extract_predicates_and_objects(statement)\n",
    "    # print(extracted)\n",
    "    # print(f\"Logic Statement: {statement}\")\n",
    "    for predicate, objects in extracted:\n",
    "        old_logic_str = predicate\n",
    "        r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "        logic_str = r.sub(r\"\\1\\2_\\3\\4\", predicate)\n",
    "        while old_logic_str != logic_str:\n",
    "            old_logic_str = logic_str\n",
    "            r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "            logic_str = r.sub(r\"\\1\\2_\\3\\4\", logic_str)\n",
    "            logic_str = logic_str\n",
    "        logic_str = logic_str.lower().strip(' ')\n",
    "\n",
    "        if logic_str not in predicates:\n",
    "            predicates.append(logic_str)\n",
    "            arity[logic_str] = len(objects)\n",
    "        # print(f\"Predicate: {predicate}, Objects: {objects}\")\n",
    "        for o in objects:\n",
    "            # print(o)\n",
    "            old_logic_str = o\n",
    "            r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "            logic_str = r.sub(r\"\\1\\2_\\3\\4\", o)\n",
    "            while old_logic_str != logic_str:\n",
    "                old_logic_str = logic_str\n",
    "                r = re.compile(\"(.*)([a-z])([A-Z])(.*)\")\n",
    "                logic_str = r.sub(r\"\\1\\2_\\3\\4\", logic_str)\n",
    "            logic_str = logic_str.lower().strip(' ')\n",
    "            if o in const:continue\n",
    "            if logic_str not in entities:\n",
    "                entities.append(logic_str)\n",
    "    \n",
    "# Print the converted statements\n",
    "print(const, entities, predicates)\n",
    "\n",
    "for i in range(len(converted_statements)):\n",
    "    converted_statements[i] = converted_statements[i].lower().replace('implies(', 'Implies(').replace('not(', 'Not(').replace('or(', 'Or(').replace('xor(', 'Xor(').replace('xOr', 'Xor').replace('forall(', 'ForAll(').replace('and(', 'And(')\n",
    "\n",
    "for statement in converted_statements:\n",
    "    print(statement)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "89df44c0-1d14-4a40-b793-e8801983ee22",
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'consec_and' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[3], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mconsec_and\u001b[49m\n",
      "\u001b[0;31mNameError\u001b[0m: name 'consec_and' is not defined"
     ]
    }
   ],
   "source": [
    "consec_and"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 338,
   "id": "fca06cf6-084b-4324-a249-10964d7194f1",
   "metadata": {},
   "outputs": [
    {
     "ename": "AttributeError",
     "evalue": "module 'ast' has no attribute 'unparse'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mAttributeError\u001b[0m                            Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[338], line 2\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mast\u001b[39;00m\n\u001b[0;32m----> 2\u001b[0m \u001b[38;5;28mprint\u001b[39m(\u001b[43mast\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43munparse\u001b[49m(ast\u001b[38;5;241m.\u001b[39mparse(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mImplies(Xor((Not(want_to_be_addicted_to_caffeine(rina)), Not(aware_that_drug(rina, caffeine)))), Not(And(Not(want_to_be_addicted_to(rina, caffeine)), drink_regularly(rina, coffee))))\u001b[39m\u001b[38;5;124m'\u001b[39m)))\n",
      "\u001b[0;31mAttributeError\u001b[0m: module 'ast' has no attribute 'unparse'"
     ]
    }
   ],
   "source": [
    "import ast\n",
    "print(ast.unparse(ast.parse('Implies(Xor((Not(want_to_be_addicted_to_caffeine(rina)), Not(aware_that_drug(rina, caffeine)))), Not(And(Not(want_to_be_addicted_to(rina, caffeine)), drink_regularly(rina, coffee))))')))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 340,
   "id": "e694d9a9-d34f-495d-81aa-f962cd4e0693",
   "metadata": {},
   "outputs": [],
   "source": [
    "import astunparse"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 341,
   "id": "20f15ce4-211e-45db-aa38-7f4a2064e07a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Implies(Xor((Not(want_to_be_addicted_to_caffeine(rina)), Not(aware_that_drug(rina, caffeine)))), Not(And(Not(want_to_be_addicted_to(rina, caffeine)), drink_regularly(rina, coffee))))\n",
      "\n"
     ]
    }
   ],
   "source": [
    "print(astunparse.unparse(ast.parse('Implies(Xor((Not(want_to_be_addicted_to_caffeine(rina)), Not(aware_that_drug(rina, caffeine)))), Not(And(Not(want_to_be_addicted_to(rina, caffeine)), drink_regularly(rina, coffee))))')))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 291,
   "id": "01b6b80a-b7c0-4f13-a69a-31ee880757e9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "from z3 import *\n",
      "ThingsSort, (collection, sea_snake, sea_eel) = EnumSort('ThingsSort', ['collection', 'sea_snake', 'sea_eel'])\n",
      "eel = Function('eel', ThingsSort, BoolSort())\n",
      "fish = Function('fish', ThingsSort, BoolSort())\n",
      "tree = Function('tree', ThingsSort, BoolSort())\n",
      "displayed_in = Function('displayed_in', ThingsSort, ThingsSort, BoolSort())\n",
      "plant = Function('plant', ThingsSort, BoolSort())\n",
      "living_creature = Function('living_creature', ThingsSort, BoolSort())\n",
      "complex_cell = Function('complex_cell', ThingsSort, BoolSort())\n",
      "bacteria = Function('bacteria', ThingsSort, BoolSort())\n",
      "animal = Function('animal', ThingsSort, BoolSort())\n",
      "multicellular = Function('multicellular', ThingsSort, BoolSort())\n",
      "shown_in = Function('shown_in', ThingsSort, ThingsSort, BoolSort())\n",
      "x = Const('x', ThingsSort)\n",
      "precond=[]\n",
      "precond.append(ForAll([x], Implies(eel(x), fish(x))))\n",
      "precond.append(ForAll([x], Implies(fish(x), Not(tree(x)))))\n",
      "precond.append(ForAll([x], Implies(displayed_in(x, collection), Xor(plant(x), living_creature(x)))))\n",
      "precond.append(ForAll([x], Implies(complex_cell(x), Not(bacteria(x)))))\n",
      "precond.append(ForAll([x], Implies(And(displayed_in(x, collection), animal(x)), multicellular(x))))\n",
      "precond.append(shown_in(sea_snake, collection))\n",
      "precond.append(Or(eel(sea_snake), Or(living_creature(sea_snake)), Not(plant(sea_eel))))\n",
      "precond.append(bacteria(sea_eel))\n",
      "s = Solver()\n",
      "s.add(precond)\n",
      "s.add(Not(ForAll([x], Implies(displayed_in(x, collection), Not(Xor(plant(x), living_creature(x)))))))\n",
      "if s.check() == unsat:\n",
      "    print('True')\n",
      "else:\n",
      "    print('False')\n"
     ]
    }
   ],
   "source": [
    "file_str = ''\n",
    "file_str += 'from z3 import *\\n'\n",
    "file_str += 'ThingsSort, (' \n",
    "for e in entities:\n",
    "    file_str += e + ', '\n",
    "file_str = file_str[:-2]\n",
    "file_str += ') = EnumSort(\\'ThingsSort\\', ['\n",
    "for e in entities:\n",
    "    file_str += '\\'' + e + '\\', '\n",
    "file_str = file_str[:-2] + '])\\n'\n",
    "for p in predicates:\n",
    "    file_str += p + ' = Function(\\'' + p + '\\', '\n",
    "    for r in range(arity[p]):\n",
    "        file_str += 'ThingsSort, '\n",
    "    file_str += 'BoolSort())\\n'\n",
    "# print(file_str)\n",
    "for c in const:\n",
    "    file_str += c + ', '\n",
    "if len(const) == 1:\n",
    "    file_str = file_str[:-2] + ' = Const(\\''\n",
    "else:\n",
    "    file_str = file_str[:-2] + ' = Consts(\\''\n",
    "\n",
    "for c in const:\n",
    "    file_str += c + ' '\n",
    "file_str = file_str[:-1] + '\\', ThingsSort)\\nprecond=[]\\n'\n",
    "\n",
    "for statement in converted_statements[:-1]:\n",
    "    file_str += 'precond.append(' + statement + ')\\n'\n",
    "\n",
    "file_str += 's = Solver()\\ns.add(precond)\\n'\n",
    "file_str += 's.add(Not(' + converted_statements[-1] + '))\\n'\n",
    "file_str += 'if s.check() == unsat:\\n    print(\\'True\\')\\nelse:\\n    print(\\'False\\')'\n",
    "print(file_str)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 257,
   "id": "c028debc-92f7-403e-a998-9dbd65c9b2d0",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'hello'"
      ]
     },
     "execution_count": 257,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "'Hello'.lower()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 246,
   "id": "61541adc-5392-43e7-b0de-4b21780496e7",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['∀x (Eel(x) → Fish(x))', '∀x (Fish(x) → ¬Tree(x))', '∀x (DisplayedIn(x, collection) → Plant(x) ⊕ LivingCreature(x))', '∀x (ComplexCell(x) → ¬Bacteria(x))', '∀x (DisplayedIn(x, collection) ∧ Animal(x) → Multicellular(x))', 'ShownIn(seaSnake, collection)', 'eel(seaSnake) ∨ LivingCreature(seaSnake) ∨ ¬Plant(seaEel)', '∀x (DisplayedIn(x, collection) → ¬(Plant(x) ⊕ LivingCreature(x)))']\n"
     ]
    }
   ],
   "source": [
    "print(logic_statements)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 230,
   "id": "5b3a4ea6-3c5e-4169-b791-e9fc6c63528b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Logic Statement: ∀x (Eel(x) → Fish(x))\n",
      "Predicate: Eel, Objects: ['x']\n",
      "Predicate: Fish, Objects: ['x']\n",
      "--------------------------------------------------\n",
      "Logic Statement: ∀x (Fish(x) → ¬Tree(x))\n",
      "Predicate: Fish, Objects: ['x']\n",
      "Predicate: Tree, Objects: ['x']\n",
      "--------------------------------------------------\n",
      "Logic Statement: ∀x (DisplayedIn(x, collection) → Plant(x) ⊕ LivingCreature(x))\n",
      "Predicate: DisplayedIn, Objects: ['x', ' collection']\n",
      "Predicate: Plant, Objects: ['x']\n",
      "Predicate: LivingCreature, Objects: ['x']\n",
      "--------------------------------------------------\n",
      "Logic Statement: ∀x (ComplexCell(x) → ¬Bacteria(x))\n",
      "Predicate: ComplexCell, Objects: ['x']\n",
      "Predicate: Bacteria, Objects: ['x']\n",
      "--------------------------------------------------\n",
      "Logic Statement: ∀x (DisplayedIn(x, collection) ∧ Animal(x) → Multicellular(x))\n",
      "Predicate: DisplayedIn, Objects: ['x', ' collection']\n",
      "Predicate: Animal, Objects: ['x']\n",
      "Predicate: Multicellular, Objects: ['x']\n",
      "--------------------------------------------------\n",
      "Logic Statement: ShownIn(seaSnake, collection)\n",
      "Predicate: ShownIn, Objects: ['seaSnake', ' collection']\n",
      "--------------------------------------------------\n",
      "Logic Statement: eel(seaSnake) ∨ LivingCreature(seaSnake) ∨ ¬Plant(seaEel)\n",
      "Predicate: eel, Objects: ['seaSnake']\n",
      "Predicate: LivingCreature, Objects: ['seaSnake']\n",
      "Predicate: Plant, Objects: ['seaEel']\n",
      "--------------------------------------------------\n"
     ]
    }
   ],
   "source": [
    "import re\n",
    "\n",
    "def extract_predicates_and_objects(logic_str):\n",
    "    # Regex to match predicates and objects inside parentheses\n",
    "    predicate_pattern = r\"([a-zA-Z]+)\\(([^)]+)\\)\"\n",
    "    \n",
    "    # Find all matches\n",
    "    matches = re.findall(predicate_pattern, logic_str)\n",
    "    \n",
    "    extracted = []\n",
    "    \n",
    "    # Process the matches to separate predicate and objects\n",
    "    for predicate, objects in matches:\n",
    "        object_list = objects.split(\",\")  # Split objects by comma if there are multiple\n",
    "        extracted.append((predicate, object_list))\n",
    "    \n",
    "    return extracted\n",
    "\n",
    "# List of input first-order logic statements\n",
    "\n",
    "# Extract predicates and objects for each logic statement\n",
    "for statement in logic_statements:\n",
    "    extracted = extract_predicates_and_objects(statement)\n",
    "    print(f\"Logic Statement: {statement}\")\n",
    "    for predicate, objects in extracted:\n",
    "        print(f\"Predicate: {predicate}, Objects: {objects}\")\n",
    "    print(\"-\" * 50)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "id": "e4e748ac-75e7-4886-add6-19a7a687b005",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['x']\n",
      "['x']\n",
      "['x']\n",
      "[]\n",
      "[]\n"
     ]
    }
   ],
   "source": [
    "for line in ds[0]['premises-FOL'].split('\\n'):\n",
    "    const = []\n",
    "    \n",
    "    if '∀' in line:\n",
    "        for z in line.split('∀'):\n",
    "            if len(z) == 0: continue\n",
    "            # print(z[0])\n",
    "            if z[0] not in const:\n",
    "                const.append(z[0])\n",
    "    # print(const)\n",
    "    for z in line.split('('):\n",
    "        if "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "id": "1e150f22-3224-4fda-95d0-95e4be70c926",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "All people who regularly drink coffee are dependent on caffeine.\n",
      "People regularly drink coffee, or they don't want to be dependent to caffeine, or both.\n",
      "No one who doesn't want to be addicted to caffeine is unaware that caffeine is a drug.\n",
      "Rina is either a scholar who is unconcious that caffeine is a drug, or she is not a student and is she aware that caffeine is a drug.\n",
      "Rina is either a student who is dependent on caffeine, or she is not a scholar and not dependent on caffeine.\n"
     ]
    }
   ],
   "source": [
    "vars =[]\n",
    "funcs = []\n",
    "for line in ds[0]['premises'].split('\\n'):\n",
    "    print(line)\n",
    "            \n",
    "    \n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 152,
   "id": "16838fec-e0f5-493e-bbb2-8266dc84612c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ah hah\n",
      "∀x (Eel(x) → Fish(x))\n",
      "∀x (Fish(x) → ¬Tree(x))\n",
      "∀x (DisplayedIn(x, collection) → Plant(x) ⊕ LivingCreature(x))\n",
      "∀x (ComplexCell(x) → ¬Bacteria(x))\n",
      "∀x (DisplayedIn(x, collection) ∧ Animal(x) → Multicellular(x))\n",
      "ShownIn(seaSnake, collection)\n",
      "eel(seaSnake) ∨ LivingCreature(seaSnake) ∨ ¬Plant(seaEel)\n"
     ]
    }
   ],
   "source": [
    "for d in ds:\n",
    "    if d['example_id'] == 1337:\n",
    "        print('ah hah')\n",
    "        for z in d['premises-FOL'].split('\\n'):\n",
    "            print(z)\n",
    "    # break"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "LLM",
   "language": "python",
   "name": "llm"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.19"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
