{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# NL → JQL Query Generation (Anonymized)\n",
    "This supplemental notebook shows schema handling, prompt templates, and JSON parsing utilities.  \n",
    "All provider-specific calls and API references have been removed for anonymous review.  \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Notebook: NL to JQL Query Generation\n",
    "\n",
    "import json\n",
    "import pandas as pd\n",
    "from pathlib import Path\n",
    "from tqdm import tqdm\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# ------------------------\n",
    "# Load Jira Compact Schema\n",
    "# ------------------------\n",
    "with open(\"fields/jira_compact_schema.json\") as f:\n",
    "    JIRA_SCHEMA = json.load(f)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# [Removed for anonymous review]\n",
    "# This cell referenced LLM providers and/or secrets (.env/API keys).\n",
    "# The supplemental artifact excludes provider-specific code.\n",
    "# If needed, replace with your own stub or offline baseline."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "RESPONSE_FORMAT = {\n",
    "    \"type\": \"json_schema\",\n",
    "    \"json_schema\": {\n",
    "        \"name\": \"jql_generation\",\n",
    "        \"schema\": {\n",
    "            \"type\": \"object\",\n",
    "            \"properties\": {\"jql\": {\"type\": \"string\"}},\n",
    "            \"required\": [\"jql\"],\n",
    "        },\n",
    "    },\n",
    "}\n",
    "\n",
    "INPUT_FILES = [\n",
    "    \"output/user_questions/5k_long_nl.jsonl\",\n",
    "    \"output/user_questions/5k_semantically_exact.jsonl\",\n",
    "    \"output/user_questions/5k_semantically_similar.jsonl\",\n",
    "    \"output/user_questions/5k_short_nl.jsonl\",\n",
    "]\n",
    "\n",
    "OUTPUT_DIR = Path(\"save_results/\")\n",
    "OUTPUT_DIR.mkdir(parents=True, exist_ok=True)\n",
    "\n",
    "# ------------------------\n",
    "# Prompt Template\n",
    "# ------------------------\n",
    "\n",
    "PROMPT_TEMPLATE_with_schema = \"\"\"\n",
    "Given the following natural language description of a Jira search query, \n",
    "generate the corresponding valid JQL (Jira Query Language) query.\n",
    "Use only fields from the SCHEMA below (`jqlName` as the field key).\n",
    "\n",
    "SCHEMA:\n",
    "{schema}\n",
    "\n",
    "Natural language:\n",
    "\"{natural_language}\"\n",
    "\n",
    "Output only valid JSON in this format:\n",
    "{{\n",
    "  \"jql\": \"<the generated JQL query>\"\n",
    "}}\n",
    "\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# RUN LLMS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# [Removed for anonymous review]\n",
    "# This cell referenced LLM providers and/or secrets (.env/API keys).\n",
    "# The supplemental artifact excludes provider-specific code.\n",
    "# If needed, replace with your own stub or offline baseline."
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "name": "python3"
  },
  "language_info": {
   "name": "python",
   "pygments_lexer": "ipython3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
