{
  "cells": [
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "bqKC4FiNjjLf"
      },
      "source": [
        "# Proof-Carrying Numbers (PCN): A Protocol for Trustworthy Numeric Answers from LLMs via Claim Verification"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 39,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "hdjdN5tRcepf",
        "outputId": "71f61fea-f419-4d1a-a4f6-1c34333ecff2"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "I am sorry, but based on the data provided, I cannot provide the GDP of India in 2020. The data only contains information about the Philippines. The GDP of the Philippines in 2020 was <claim id=\"830f\" policy=\"exact\">361,751,145,451.597</claim> USD.\n",
            "\n"
          ]
        }
      ],
      "source": [
        "from google.colab import ai\n",
        "\n",
        "SYSTEM_PROMPT = \"\"\"You are a helpful assistant that uses the context given to you to answer the user's question.\n",
        "\n",
        "**Answer Format**:\n",
        "  - When you provide any numerical data or values obtained from the context, **YOU MUST ALWAYS** enclose the numbers within a claim tag in the following format: `<claim id=\"claim_id\" policy=\"policy\">\"value\"</claim>`. For example, \"The GDP of the Philippines in 2020 is <claim id=\"5e1f\" policy=\"auto\">361,751,145,451.597</claim> USD\". THIS IS MANDATORY.\n",
        "  - Never invent a claim id. Always make sure that a claim id is in the data provided in the context.\n",
        "  - You may simplify the data provided in the context to make it more readable using some policy, but you must always make sure that a claim id is in the generated text wrapped in a claim tag.\n",
        "  - Always use `policy=\"exact\"`.\n",
        "\"\"\"\n",
        "\n",
        "\n",
        "PCN_DATA = {\n",
        "  \"data\": [\n",
        "    {\n",
        "      \"indicator_id\": \"WB_WDI_NY_GDP_MKTP_CD\",\n",
        "      \"indicator_name\": \"GDP (current US$)\",\n",
        "      \"data\": [\n",
        "        {\n",
        "          \"country\": \"Philippines\",\n",
        "          \"date\": \"2024\",\n",
        "          \"value\": 461617509782.355,\n",
        "          \"claim_id\": \"ad3f\"\n",
        "        },\n",
        "        {\n",
        "          \"country\": \"Philippines\",\n",
        "          \"date\": \"2023\",\n",
        "          \"value\": 437055627244.424,\n",
        "          \"claim_id\": \"4782\"\n",
        "        },\n",
        "        {\n",
        "          \"country\": \"Philippines\",\n",
        "          \"date\": \"2022\",\n",
        "          \"value\": 404353369604.631,\n",
        "          \"claim_id\": \"5180\"\n",
        "        },\n",
        "        {\n",
        "          \"country\": \"Philippines\",\n",
        "          \"date\": \"2021\",\n",
        "          \"value\": 394087359848.11,\n",
        "          \"claim_id\": \"6584\"\n",
        "        },\n",
        "        {\n",
        "          \"country\": \"Philippines\",\n",
        "          \"date\": \"2020\",\n",
        "          \"value\": 361751145451.597,\n",
        "          \"claim_id\": \"830f\"\n",
        "        }\n",
        "      ]\n",
        "    }\n",
        "  ],\n",
        "  \"note\": {\n",
        "    \"WB_WDI_NY_GDP_MKTP_CD\": \"\"\n",
        "  }\n",
        "}\n",
        "\n",
        "\n",
        "PCN_CONTEXT = f\"\"\"Context: {PCN_DATA}\"\"\"\n",
        "\n",
        "# PROMPT = \"What is the capital of France?\"\n",
        "PROMPT = \"What is the GDP of the Philippines in 2020?\"\n",
        "PROMPT = \"What is the GDP of the India in 2020?\"\n",
        "\n",
        "\n",
        "response = ai.generate_text(\"\\n\\n\".join([SYSTEM_PROMPT, PCN_CONTEXT, PROMPT]))\n",
        "print(response)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "l6DSUhr7i9hE"
      },
      "source": [
        "# Simulating the presentation layer"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "o4EiMF7BeP08"
      },
      "outputs": [],
      "source": [
        "import re\n",
        "from bs4 import BeautifulSoup\n",
        "\n",
        "cleaned_pattern = re.compile(r\"[^\\d.]\")   # keep only digits and dot\n",
        "\n",
        "\n",
        "def get_claims(data):\n",
        "    claims = {\n",
        "        k[\"claim_id\"]: k for k in data[\"data\"]\n",
        "    }\n",
        "\n",
        "    return claims\n",
        "\n",
        "\n",
        "def pcn_validation(response, claims):\n",
        "    soup = BeautifulSoup(response, \"html.parser\")\n",
        "\n",
        "    claim_tags = soup.find_all(\"claim\")\n",
        "\n",
        "    for claim in claim_tags:\n",
        "        claim_id = claim.get(\"id\")\n",
        "        policy = claim.get(\"policy\")\n",
        "\n",
        "        if claim_id is None or policy is None:\n",
        "            continue\n",
        "        if claim_id not in claims:\n",
        "            continue\n",
        "\n",
        "        # default to warning unless we prove exact match\n",
        "        badge = soup.new_tag(\"sup\")\n",
        "\n",
        "        if policy == \"exact\":\n",
        "            generated = float(cleaned_pattern.sub(\"\", claim.get_text(strip=True)))\n",
        "            expected = float(claims[claim_id].get(\"value\", \"\"))\n",
        "\n",
        "            print(generated, expected)\n",
        "            if generated == expected:\n",
        "                badge.string = \"✅\"\n",
        "            else:\n",
        "                badge.string = \"⚠️\"\n",
        "        else:\n",
        "            badge.string = \"⚠️\"\n",
        "\n",
        "        # put the badge inside the <claim>\n",
        "        claim.append(badge)\n",
        "\n",
        "    return soup"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 43,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 55
        },
        "id": "Q0q2lvmtcgpD",
        "outputId": "0c18d56d-f6e9-4777-a43b-244cb3e9a2a7"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "361751145451.597 361751145451.597\n"
          ]
        },
        {
          "data": {
            "text/html": [
              "I am sorry, but based on the data provided, I cannot provide the GDP of India in 2020. The data only contains information about the Philippines. The GDP of the Philippines in 2020 was <claim id=\"830f\" policy=\"exact\">361,751,145,451.597<sup>✅</sup></claim> USD.\n"
            ],
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        }
      ],
      "source": [
        "from IPython.display import HTML\n",
        "\n",
        "\n",
        "claims = get_claims(PCN_DATA[\"data\"][0])\n",
        "soup = pcn_validation(response, claims)\n",
        "\n",
        "html_code = f\"\"\"{soup}\"\"\"\n",
        "\n",
        "display(HTML(html_code))"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "6WOk0hLicgmv"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "31fKmEICcgkV"
      },
      "outputs": [],
      "source": []
    }
  ],
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}
